From 11a6fcd7b2b5e31f74cdf9a5bbc54a9f20aad37b Mon Sep 17 00:00:00 2001 From: Trace2333 Date: Sun, 12 Jan 2025 17:09:56 +0800 Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0dian-team=E6=8A=A5=E5=91=8A?= =?UTF-8?q?=E4=BB=A5=E5=8F=8A=E4=BB=A3=E7=A0=81=E6=97=A5=E5=BF=97?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ...4\345\223\201\346\212\245\345\221\212.pdf" | Bin 0 -> 214525 bytes .../finetune_msrun_log/scheduler.log" | 5872 ++ .../finetune_msrun_log/worker_0.log" | 10218 ++++ .../finetune_msrun_log/worker_1.log" | 10017 ++++ .../finetune_msrun_log/worker_2.log" | 10017 ++++ .../finetune_msrun_log/worker_3.log" | 10018 ++++ ...lama3_8b_8k_800T_A2_64G_lora_dis_256.yaml" | 206 + .../730_eval_min_token_equ_1_log" | 45002 ++++++++++++++++ .../first-phase/dian-team/code/format_ms.py | 30 + .../dian-team/code/sample_script.ipynb | 610 + .../dian-team/code/test_math.ipynb | 1952 + .../dian-team/code/test_pipeline.py | 126 + 12 files changed, 94068 insertions(+) create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/1. \344\275\234\345\223\201\346\212\245\345\221\212/\350\265\233\351\201\223\344\272\214-\344\275\234\345\223\201\346\212\245\345\221\212.pdf" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/scheduler.log" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_0.log" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_1.log" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_2.log" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_3.log" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/run_llama3_8b_8k_800T_A2_64G_lora_dis_256.yaml" create mode 100644 "2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/4. \345\216\237\346\234\211\350\203\275\345\212\233\346\265\213\350\257\204\346\227\245\345\277\227/730_eval_min_token_equ_1_log" create mode 100644 2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/format_ms.py create mode 100644 2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/sample_script.ipynb create mode 100644 2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_math.ipynb create mode 100644 2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_pipeline.py diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/1. \344\275\234\345\223\201\346\212\245\345\221\212/\350\265\233\351\201\223\344\272\214-\344\275\234\345\223\201\346\212\245\345\221\212.pdf" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/1. \344\275\234\345\223\201\346\212\245\345\221\212/\350\265\233\351\201\223\344\272\214-\344\275\234\345\223\201\346\212\245\345\221\212.pdf" new file mode 100644 index 0000000000000000000000000000000000000000..895bf2ec1c407f97feb67a3a0a43f22031036968 GIT binary patch literal 214525 zcmdSAQ7$9*2>oMW~& zMnrr)dh{NHL|#~whJlvt8_E8`%)&PYW=4E^d^Ju*7Y=rBO+^Ms`B=;l_M>q9=E51bM7%RCV@zcE8sHw_K{! z|GQs-hZF4_ay_lcjid3qo*&2ionEY8klXuMyEsqF_j@1yr^j%=&kwhe$J+}%IKGc* zyx*^U;NEOp&pX6nIKPi>y`JxJ^o^QV7nQ1AhlleV-x;-cwX$N#E*ipmk|@Ggppmih z_;7taVa4!b@qPm($EznqD#qdQ;cfG*<;CIsM#>!A9`qWlY6pPf`+Rx6z7w*#4g3AN zu(RFucDA>$^ZQAT4$tqUrw4C`$Ismt7H@oEW+cy#m$%z5P-mkEw?E{ZL5Bf+DuI6b-u)yXWg4M!t4lWuj=^^XhVeJfEBuSj}6=|(9&ep zf*qHlzEGIeU!HEUUBFETq2~M6hQf&iGSP< zZ|g0Dgv=^>S8AF|b@;)0#%jQw*e%KK-d^onr7~G4KZx0BDWl*vM&?>&$#wV76aAzT zg>TdFl(9D0@krIhd;cK&C8Af?UiqqdArYA5AAk zv#0;5obYt(Hu~%)L7WW<(eD7ZOppIEb2S!x0L3k$Nz&Us=pOEE8LYlqoD?Dt9_V*q zZvag#fZmCK*q4t3!k$-~r^Jk5NMeV-K8ntOPd(6^qR&vAKE}6ZZA6OB3+l;r@Kn3` zYj~C`MAMKjMZe0<>{|>vWT<*$i_{2A0gRrR<##}R`Ub4mr-i;OK{>i-=SXo*--p>v zkOc&EVm0e{HX{!!{AeZ)%1U_DLU25iRieuLpm}3YE4gWR!!3P?ejw_pazpHXfTz|y zdLStpEDd~Ulhl++{Ar?yeXQ8xcSrfFY=ZI){4Tz5xP<2)U|{fb+rw87`<^9pw7~$C z3)9HJ;kcMBuPyLAk8Hs~09eIvs=yFs`2ixN03yl>SwiO1Oh@T2_&od+9iwMIIrVCq9ny z*8_E3UQ6WsU2sQF^OIu0tG>sQ@pHii!KsHDH|%3@k9E9&$^BII?6XPvw9k`VSUi;^!;mZKkdB*o6ltpm zKUQeL8XB|J3y!(f)*zG;)1a18sKojhz}wE0%>feHO$ZJiZb6A)A*!?3yvH@<%|4+Qoe|O7^_;_7=Mo8csB%pynLURxJao-rk@sT}m5A zQ}NN7mR4n_xwA8*x#Q8^<`*J2Esv2~ZcKG6F`tvq0WD;Vwu>N9Hc+hUR_~c+ zE|CWGB7+61r>9fyfQ(Yqxe6tqTf#96Z-kPhS03@pbWO~7^49A}0b)0v^1g_ZQ1J~#FJ)b0g(iOt%kCf1p-rdhNi+qr|0QLg2csQ=IH zg_OmsgSY&xRYu9Wb)FjF3h?Pqnt^yTFBObeZ2h@_*s`)a4L}JWHpWx!*YP2UFC;Nl>r)t zN1bJXCyD~!iXTMJT7|JI;6!J}49FN;I}L}5vJ{3KW)B}M-{@u>Xb9bw@PWg2rL4R# zqoP{1k+^aLYHEa5Qg7~6CVILk?|s%rmllUBBE`4cjQnZ&TFAu8l-a()^nuFub>uF> zrbpjUxUWc2LL4B1^E1fBcC{%$1&~dC7YqEA3E8<|`Srv3x6&s;Nr1+pZ$ZHOq#}Va z$lj;GgwYqA03wT;6A3|a!az;Iat}DoRROuWw`D0rKLldBbPL)6(3!k?K#~Ip9cwYp&E(WMfs0jyC_p+qExP%PY=Afhng6Me6+yM|G z=I)wI1T?Q9t~(V(Pa#gW!cSCKE}&q(@NY!YNw^lSc<3$k3nZ+dKq5S^q(B`)+YS$a zfE!9?ZW%firZvo_?zSDUqaj8R+z0&vE5H?`iysO^YuDsHIuNXhSJhecT4?s0yD&7NEg(?GIp;8y=z$6#AwbRK9O&)bz{QwxM>{)pZuxwfPj}HLj7YT-G zGpAOzm5(lKr9log{v0wjSMEjkjvXMbDk;z)G%n>D1Ej8J8`asT17AW#E>F`dmh=C` z7!wUUK1xE|$JDCuir~rL=LIQ2E+&LdLTrG5DMLj7N!8cv2`P~t`^YLOPKe7a-LDoA zAFZM-$R42t@qG`qT~l030q;x+StgE_lES@y{~Jf)UZy=O=-zBC+FsFW%5kfD{-`Lm zit(tb&khixgAr0>f8_m#a&yMGxRb@mw9Pq)1ClXT$P6d}#JU?qI~#~7VE@}O;#mZ? zVXaH1;ob%Xy&$^h{Z(`+0Qi;oEFiE)zKyZ~uh^zy`;N~*zV1&12D4Ird#i!s0WXvW9zPj>j_fHkziVV$yQKxpokQ3hm4N%BP z4x&tX?!$B;2Q3jYNm}fY@Ll#zf-*&Q;l$EfaSMPJrOf^Ob!KP_EL4glqdM{h?0GEI_vPAfctpHj0|ee1GPPGpUf-uXeu*zgKcl-UC4iL)kb@4Xa}Wch83 z^Q5fVYM3B=Ep1}2f-2Sx$+##5HoQph@?CBP2pE0Hmt|hF|$AT8l+a`D$3<@eV0xx3sv2JCRd;CMd&G16M_s8#*!dYaU9A^ ztMx@7!i6zN24i0{x6BF_9iwZS7cT~GQ2yHEO(`s!OOa&Em2}F$EjfsEG=Z5UGGUpN zGSQ2?7)R9L9XHg7HQaiFi3=y{xIHcPp;bCP_&$3wX`ACgHhtkXE8HMQ+ii(AQztCRJ3nqKv1QV2Ek@54gy|-0o6z;n!NxT!d z%sCPZi?+8>lhi(B(z@d<({)GF^5q)~@xL zmM+dxVP_@8alzb6``Ko1bmt-_Yffiza!Ym*NyhV=q{`R@ zFt-rg&w4aJ9XQ*xr}b$;aju|nHC95KwkBFf>sFT_tnQ?^u7WYewEkc7H!2%iUiQsh zcC0pA^+=9uP*}_D=LdMUN3Zg|+&E83Wq|#)u9r6`N6U1aKom}W=$=kMKXFU6!|~`+ z91o6ff3;=WaGR(X9bgtdJsg+YWLG?bs`a@iJ33$E(XIPZ2MtCO8PvEy}JT|aDuca)?T|CGV2AnF-pjUO}z1`&nptDZ$gb*R)M?3Ol zs;WuyxerPU$aCcpPYS6|Fk0{uH7=bA6GL23;HKtKr3gpaDI-2j2sAmhk%%k1RpX!4 zod@XbMMnuD+#u#}Mi+wUe?%iELFXr2Dsnc6&b2*q@eRVYb!EGw>3=x0@$sqrXU1_BRIujhK`vu zZ2fI6gLY369>xyBF;C5<_@W)GRyGqJFvttnjfn{psPm=YG}?DK$$lu?U6s!@p}n7BIi|h|HVQ>2|jF! zx5;`nw`5{q&&R~FLFD|KHFFEWle=-Sl#+{Fq6bv^iI_cN&P(BE%g0(RNlXhH`>9@=9Ox?=F&N~U z#wZ@G?u{iZgiI46mv-2|L*Lhjc!pakJXr9kvyil%vN+XX?D#}WM}D#`Vt%iiF5b0u zznC;=Ei*h{V2#bIQ7n&brDUM1akFJNbRCd93cYfEdA0dw+xFOQfX}wfb+P5gLbn{| z4SNwfwDZ~?J90k((Uq{Sv3>H<9<#_A^LgEw&`y2k!RMZv)^+P>-=oGjSm)(Oy^+?^ z$HRMCq$HL3TH@+s_o-;%JS2d zv0!jx$=ILALrje|M(sKSI$rnpod$r@AdgnwhLS7#OZxakq%{ZBtkf0!q49u*ziP?| zIz?9Z7RW(tcMs@(hVmOP49L7AJ3_6^ssD3?s#GfoQ2rs{`Zb_7MQLEoo`J|lGX{Tg zbZ_(KFbOwihRIjiF=qnl>zWqb6n%Kh?;`7|S@3-sz`(Y@a z^cyYa!v2YSSy+PJI2yc6<(;Qc^XljBuwu%`m*x#(TlA~9=HyD_eUGO|2snAtwSBCJ z!;i07@0(uEz*froN;;!$Sv`&le5I+iHi{sn4$?tkVJqeuBvoZub4?}+R0R%~Rmj@X zIIebrWRrKyB)nFWkAoaz6%91p!(v*k4q)rvEOG@GwkFDe>19EHN>Q0h%GsP}mG}y4 zuk`$K|K?(933^Rcyh!ntOSt3euZ;zO)^CP0{xef->H`&F)^F1Qma{7u0KuS&PcW^d zeL0Bv*{%GJIY8|y!$|JMfYde4{0AG?u!hu?k=AT5vcT%P0tGlri--h9WuV8b^#C?v zf>*4g8eai}mj-SL;i~d`HG~To;Ch%a(e|^&EwuZMAAWL$GM{l0gYKz4qs0m$GNZ+n zjy&VV&pemw76swQeM5;L>bdP#=yC1wJu-acJ{C2h=sOPGfWlxkz!ybo9^K;HG_!bW zLFVx+tCvx^rEa2AN8wSqUNIQ2NcgDhFQk0Bpr@)h>M%(^TPp7`QRiNYmFXnxw|r~w zZiCuL0w~~POJjHl#Il0f*VWiK2Lr6ih^|mIAeF4>DAdaWYmmf3xL3x?Htb=QO-*Js zLM>Z;?@9tdbkEsZ;}V$GX1>2I_3owVNH|e>%X*~G8{?VWa4ltJI;6z_vZHKxXK4$# zfclLG)q^Jy>_vh=yS27eg$0F;t_XwLbsp}$Lk=*9P{~t;7vt3p*9+=N5v{^h?nnu# z-GRsU97aHOxpvC}mSzVxVg+DL<1NBxr?DHf?N#g!ytcGZ?Y%Ya96<{LFxHIKr`OQ2 z*D(q!%{NZ}5eqO3;JmHzn|7e(1t;KW1_By26$NwNFl6|E{n%Qqhv>F3*|a!2HyjE^}PU6P(VW)+}KcmANRY^4qRGHp+t zFSPR+YK~``w3&S|wwbYGh2la$+H;otc}RDuvt68Pkz%zb9ekZxP_%qly{6f1`BapT zAB~O9`+A>`Zy2#+a**Yw$S*LKSit)qJ&-J)Ks(U$FQ4A`gr3{Ntt=;0;n^**Di_Yn z=Fhe?VV>FxYOI;}J)r$hHa1-KPZT~VagneIrx+@&OR0*`&rS?Ipjw*g5q4Dm)o^#o z^2oz_sy8A1k0RtY1q`7#%ttEvmTo!MD)wGo8{^Ke=PcRZ;7|HdtaLQiJ*?E-1BZUP zBv?L6HXC6oZPD(`*^FGPZXP@ArUsNz2Yyy?rN%xPa2WS)d9cFxx(96(UZTZncyDMf z?6o;9dBvyGX>s<d%8BLYi7nfk+XkBLRfIi7S;BT|OoU6b&IR3h!v9?%%q>N)BC21VoKMB$$K!5{5_@ zEhVbCJ~SMv2$TZlnsOhVd^#Puh0B6Z{x z2r(p%QIdu^oe@kCpEswm)!RK3?~|tSS4-8j56gE>DJzWdtQr>9hlv>Ejh|2_1`VQ( zga}TVEGG3txtt2Y%%C_5uf=9!@U5lYfcWGg=`mmwG?En_fEO#hT6Krk7)+)4EDv?F zCDIQrH4jn+4PH9bR-jCx*;W#gM%oh8XHG$OHz(-#f0Y;3KmcK0YMeW_o*3(&OiXzs zfQka>zO4gtG(X7_4(}P{i03^TvGU|i)BbC8jArxfoFOwC+M;0Wxr3N^A}%aLKr0p3#3V)O_86_ElV-e+5s(4l?!bM5f&n z3E;=f!+9-GFM4*P%nSLlAicBQK;`WZpnm`RE%q@0EcnBuIKv_kA|jkP{dX7c9_+zW zE^%(5n`sNQ`4N(lk#13VF@Z4}B2(w>HtMxNAIMVLqy#s^7fs?^G+ z$1S!)&kQZU(>MGkulSB1@toe`+CD}$KR>3g{Mg@f8I4Yu45mTXOCr+pj%RayKaOrk z4t7%Mgx_Ntu)VPdx<T>iw!z48GJ{jy zB{@=-5yiwZZ-w>n+6{v34w%`+&u3ke=ho!weera`sd@!lqLpq}@SLi(qQ9jR23yD; zY-b#@M3}8ctOr!W>JPyl6|R~|(SJX*_v1n*C>xERv`Va`2V6a%NY{=fGwLPLSLOhm zv0j4O;BM^G%XHn?C}%%oac$HATE)q~Rb|O<(VuPsh!cQsCJTJ(b+F!tb`&5oa}Vmf z8m!?211H8gxoRqeA|0ZCWa7OdfAq?I=8=01?Oy4ee`3|uckTg@27Ij9R6^c84gr-! z#$}ozgAlEo_U|aEJ%DVzUd{NyN$Vy0YbpWAJ^jZg>HcZ>R#1xj=QA}G((C7R6SC04 zIi!2Dk^PUW>>p}6eAiWNaV`M}K50eQ%surZ&cjB6K6LdNtz#Ki3VAte z50Y)ebrG#=)Oa-v=JRI}cuaCn&Avg0q?S+3M^En3++6}C=PHBMh;BiWS7UkdbQ?Ge zCzT|9-VW37X>_yP@gv=j^Ec-AErxZ6TSlKaS3W(sw{VCM)e9-Rx0whb6&dSjX~7NVlLj(J8uT_ z$KcYt4ol7NVN4wiicS+gz8Jq`MEiAX!YmyN0bgUq6&T`kGzP_M|-HY-Nvh z>CNAF{xod*NH}^;IBHKm@|0O0H|m2CkIFA4STAklT3squVd3;@=sI}!wu=3EzW`I^ z@pI;;rbU%Cna@1w#gBv1!2HV#{BLXTzgmlj7BgeEiF>GTDCa6h{;v#k1ik2pBX-8juP!b9KWy0 zKGG@X0`pGAH=vU7Ye#A)aX#QvHX3Ev4YV5UXdK1CwQsnM=igwkMUTFdvKKha94gwf zhic5TS=AUIL5@i^Fr4^0R($CF6KE52y zsu4P>pj-y)-6vta6u7+^4ulO?aW6M{oA!Ccs(TFcZhp^7-)(@9O#KnGF-eHSICu}8zBLeBHn+94I0!zTmgKivOcIonJO?EilM zGKvz3UnSge|IIJIf_{6KCnIyb;Qsf8xU*bhR&PBuRO1t^j`b*m&v-el(vg_f-sddK zk&6Hu$42i9RGqhPx|vt=TnAIvpw?eU*x(GLSH1z-`yr{`vL}BnMwz{xF|J} z%r#dtxtyz`LBs5ce2xe4C?7{JA7!y$T3Nx-xDff*n!~i6&Wp=oML!L|i-iK!!m6Z9Y zy*c21KreH#7jR9FihMA7jWE%^hkx=`Dnj&asFa_3lEzxSC03|Kf#=B@*`XH1KIL>)Icck3~YxoYCz9+rjc`7vcoqfvC(0 znhINX{g=Dgsn#rdG|t|wid%$R)Ds_jL5w^+0sldKqHeKY3KGy%vr$Eo?Y^gUZcoI_ z5|MI7nitj)^RzA{^n9$iy8^^+S`@zdFTR+oSYP=aMtEHoi=P1~((t~&8xKhL#8Mf! zNH(*XswcADTx`cS9$UsOAqkqM$i`V(0*CjnBDY_rn!5C?Qe5=@BXUgi?0*$Gra$mU zC%(^efF3&Z#`haehmb?2fJGmAvvmk|bBd`Kz=$g2fFafp$KjP(M@bNl^+VBbq@Ka7 z#}XG-Aiks(98vU2rr-uWaiRxy%@J1?^oj$S6g@dg`rKXH93t5&EN&zqe?3LF*v9_j zv1eR7^xybF##<0sHKkJRT7u7gkUGJU5|ChF%x5woZY%`1fi_x6udLM@gYO)?EB^9m zT^*%!+q>AwqKdY{q~(%<>^a0jW}m;#spjBbwGfcv);u=(dd8LUB)2Z1+?);}Jtn-E zyWmTdkB~`ZVGVJ%Yf!vLm3@0!PVJNaAzFXcu>Z%RH52_`HCJYaKcGTIQK}k?0ea&N zxt$-thkAlnE|M^+^UY3bJ*o4|5+Z6}9#KX`ghUXRNm{jiF_~}K(#0d%I5hZ8#glCfs@5pdK0?y$nw=XnV?h5g8l^H) zkJIZ}$v)%;1KObu!A@AD0_VUG@{o1_VW=QchzwLCfeP*zBqz-0nHz>?h1%jUC6e# z@YSLtur;Fn6%4Art8DHNHN*aM5Q;3XCKg3T7I&C#tsAg=Xt-NL=9{~B&5&&FlQq@9 z`w}+jgzWoDqAwE-Tm`w)x7vadI++e&aepgwmOOD5d>ee5OTviT?;&y^?IuXn$)G(1 z6?40Wb0cwMd)S}YXMnWQrFswK!3@v4(O9YYu=x$Z+}}v`59Rq+Fv!I62cOhQ60rR` z%pfs|i%}(R89TqsSD7Sqp(X89 zHLE{6?UMJBwC*8yuH>O!F(bkiy_IzDA!3VO{QCM}#MHHjryclII$%TVE~FSFM!W*_pV!!&t6E_?Lp5!qNs}~kMrRhN&XEUzvdFGDJB{9H z%%O*2YhO5<1~=B;@UZ7Z$%JGGo#`Eg_cqvUn9s{-Hy^%aJ!^CK^WJZ*i*m#y zrF{!(1ga`9-+Rl+v7fyZSUouKK|j&l?1!-?W4CGVOIxpV3gx4tjZq7#q2xk%A7e_1VU$(^7h+e@(}H(_BDZv5mR zcr~*7S+(N~+~mY6`43O=SACa>^$*^xqqt!+NDuusgRI%>Z^FYfgCfE=57_QAR%|}& ziyccA#T}VA&0!L0gJDDBm9m)1#*>;AT|$z_2Hlw*cEs0;b!+RcUjwi>&v$Ek`yNDF z_VyC6F53#BR06c)o3(iKlM@kT=Mr+!bf%&}<}%P_;;J(itpQTt!jG-W zKDxoPJ{L*Caszb6JtJ!AU!D)-xbIKYkxYFGRskSWlJT`&bD8)eQ(jr{V%kNfkz8RG z!RS+$nSgTyIp|BLvt$8!3t@K%(&!ig00XtP*~YH#z4zwdsP?UtrUUK+M0NY{>B}Vh z>_aM9qpYCF4r^9vqc(zP870!iHp^&SXxaemW3Rc#_QUF9So+*|8@1 zyp(sgg)h?l!^4OlT-umyA2Nw(5I6&K47T6UQpox9nfwRfRDzfZHeiln{5IZfy_@7F zA_^7!U}$wkj(_9@fK%OCG@^EvX6Q*v!eT4D^jQqFHNa_3|A2^?5f^=_xZ}nMsE{d0 zas{_tt}wISm(Y^E^kxJ$ceH5;HxMtEY1$PQTv`~p!RN{?`AC>StElN0JZo~3*KCfqXL;V z&p&-ndhQN5lZz~1Fu}N>K+Ht750v9UI=xE5#5FazwFh+n>HIA3!=0RN-UkWg+~Lqy z`?XFSY%Mz7(C2cN>Coqr3R)OC?`>)C5}(QbLpK2_t^l;(pxYrpEo>iXW!1S#dkM=H z<-6H){7YQZ_^++=KtA`>Ps(2>ulW>wV`6Qapudt}c~O?jR9yV_V31YR|8r_%V*D!% zWMuhcDPAXj#xj^5e)z^ClEW5GYSGd{Aoz+lFzmCS84f;a4$KnKko);DXYgxkBYqFf zxXFs!JGq|6!13?#qVj^Kw=CkOb^V2C&?|wJik9C9y+Zlnh#KpF__Tp&e?4igp#yvi zcTU@9XU|T-wTp9Lr(3XM8aS}h_Pt#%=dBMz#y^?`h8%nBOr%wff#{Z)%QfksKEVlpQ)_SGS`7JRXdH zr@j11BEHzXEhq!T#tcO(e=z_-uZOOR3q#lMW>?XVsz8W4aIuqY#vv_H4{^H`X^#b~ zmI(-&mrlf~y5(fY2XC7)9mdM$&T3ws4M#l{{yW(**v=f9h$kXX!|Oia$B$%Vp|ZQ0 z#kOwn&*WqWJ-n6r%92K6rAD$@)0@-Cvtv<|4EdtG zbuf}M3z2H8$&=lf?7v6xQ0uaJl@y9>s1B-Oy1nY7^K&;h9mET9Cd%^(Fz6Nah&zaQ z16gfFV^WWXb*xLnJ;7=>9kbS=7xx?Ivs_?DYin$h15G69PNALL_X3ec_um;b&Sd<` zeg^a19HT6am-AkavcBNfYb}x(g#=-EEFI0GMxT891zNHhNc0cs`72$9iS5sBp(y1j zL;$_v^i6MfY8Q?*n=D5bZS12Z1wYRoc$#hhAyZy;*q^Nrm}nx$>0)Vyyd-WL%6@w>Ar7t4KI9TX5!?eqKBU&k=nJ_-wcOs7QV^)k zJ`w#v5sFp}&vmHobcFabFx(ymwo!L*u$%$4R|DTIyszdQ%|v$yD0?EU*#dL$`xMesRTqz`b_>WQJ4)(i#I(Smf zRU$IaC)yAoeL80~>N@*q6!mlvr~w^V+o-;IfS?*fw&nc$N=60}!J5NGdQVE5?YF1c z;1}-}J#N!<_oIIxGH2QjT{pP>Io%n!-!58ndV@PC!S+ zrW=`*^-qNc$pMxN%A+Sgj!D>U)5%QU!|gAIeL)_Xy+YHSK*0ozjTxn09c1C!&G0u1 zFP&qeR)nw#n`e*4__>Rkk)qrl$B4i6W) z71S>U!XNO0F7NwLe$>O~1_4u0ixFXDA^8P|SnNXz53i$8#P9QS@wFV<-)bEQxE`vF ze!Dikuo5Cp2UG;LBg&tZqn`-gsXHwtgS}fRYRUvTE4@l;y&Q!RhJ{j5L+s?5h_R7e z#N%=7X3Ol6A``(gh9+porV3S>hP&*3*}@8|b5is)(+VZjoT)o&$anaIro7IDL{9c$V7f&grU-o4^1*)qUNxsAAtrU2%n4r3YI3$o9-Ww46BhK=yH2 zhd6FbUjjh=3KoEUY9rbz$kT*j8p^aM3vdBF=#iBPXsQ`ZCn`fE; zw-*{L*D5-ea>22DLgg*7udoKMo~STUtgd5fQzoDVOSub5hd?kj=TF^EKtB11)7?lC zLOtxeyAx_DfXHR=_hO5u!PR3lMi7{yPa+_`9qk{pPufeo?*eacH~x%Be(|lco56^( z_=m*(-PpzU$HdALFAxjD00DgC5yA&g0gu1O!=rgs@br6yB`1SJxGs8JbQB#J81>YP za~@~nE-{s9F6Q+{+^ug*`+&+OKMZ^m#0SB7A<2;?s-=@6&tdoO8@(3Uq2*l+m5K{U zc-N7%&Fmj zF;QD+TAg$aG+v1p77wn|_Owf#@d^}JK`6?6(7CNu20%(x4B#A|Zjf`xEKuNpLf}9d z4q9l`S{x%$2PIAk1Ncews%&pQVwAY3#I>a-c6um*hUxZvpoDeR1Lb4D!K16sE6?y3 z@I+giq>6l$H-F+;s4@)jig#F52j@1vh@bHX@J;X!H4SFhtaU{At8DzlAbkgO_6nC1 zg(nVtU4#368=v@WEEHClxcUGYn&wlFnV$kdZ zj!85MxTd91oH@a5?9gS%8fA8ml-wMWGLxr8D&k&E8(m4wfn2+s9dj;3B=c)_@?uwy z>5EF4Z0A=dm_;oqFOw5SteR%}&ewL*$4eL);{1yek}ar|>b$jpiiqQbytH5d&U-Br zKgWpEq4PNJRti3jKcRA_r!XfPZZ>I+i`I8q)n{T1S9#VvEFw)OEx^e%aa$Vj-+V&S z*p<(B?qFV18f^ZfaG6>Eidz4V6{?w8|7y}^V*NwOR8f?G-K2-^ctd&h2ehgq?lFrj z414&!l9-!;+C?0Vqd-ieV>Onj&bT2o&6`Nc=Zw9>h?3VMmNwSNuDHke@uL`c(843; zA+c?WSP0M%c-Qfy@2D-!e+KJkp4s8DAHB))x3MjNwZxZ%pO_s_SiJtz7l~WLKxsO7 z-7EGRdfiYvFfZ@@?zgWJx$wFGvPD|=!A)-D|XkG!)Cw~X4q}oam zjIxrTf{K+wGcI3m`W(B#=m}-$YZOeMbTGx46S_DpQ(hT&g}JuGR2367AsA;8wM?#u zgZW+3u_+;tvAg{!IwQgiUD)s$L<|P~8i*2}E1q*tSFReH_rz=nKh`>z-L@aItvr!L zY8Qbeffi(KoQ_yBs=?Y!bRGBrI%R}Z9k3${dx8ZO=D5(|elOdAROKzfpnScg`SgJ~ z=b@ngzA!u4#^e@?zRZn`VyDH1+*G`4#|wRN@(kQJ5X1GKHOKZ>nkEzLpXNfM%oksR z2!7%KMGH5c%;T7;D5w1rN4O4zAl>~LIEUj2svT*W&Xgh3=y)WxWUnZC;8exW zK#ZjxLrH3gF8Z+Hf?-PGK!V!OX%N6>L5j0+I?;`kC>-01x#Jlz3pAC}g~~mqPJn+z z;xnj@xip^fO{(|i+y-P{w1++Sa`jPv?$IzX%8?dx4Vod|Ro$LcVi&@SrOq#ec&b>7+W;!K z&c8m8BrTuF7k3>syA~42S&j&;kXj`&J^?SW7HV{AKmwVqZ6kEK6cAXvunD~R}n?#f_gE4KTXr?;Pu5C|vaH1I>U4MCR zZs5+#yn10ZS=p)bre2LxxUCB@xtF+BS%pcSc7Eo|Pj}$LYRN4BkgR{buKwR|u>YU; z4w%^g7*2E&rDQ=EpoO1&zUk$Y_#vHe;}06P{!T471_PWIzvpb8kXS1%FH9tTvQA@B zTtD2Zw#A)FuA$O>b}vMHwVv+9yZa6!ErxbJP-^r84OG#+j951`-tVC7t@RG)G4Yb#f-jJ31vJI zwKPFJ$w3(Ax|}+Uo_!a1W?SEefEqp6gQ}|2dd|3MbL@aW7Kor(kKvkSeJ{GtrIBq_ zAcuT5-4H2Wjvq|y8xHh%9td*wdm2Qq>nc;^){U4?9ID7G>CXAd6MM5 zWeEX#+4^+bjAXyV5dfO>!+c!lE(LYsosZPs7x)frWL5UaE99KkN)>Rit^+<-$*#liA!1~c3~`v7?$5z^ zmw_ebvn9~Dm;EFGoR!~mnv`cOxaAY%>`wI%zbA4>b z3SQ(-MS3fxai$d%11AWXj2}C-o zr(#0h%io4wI~tW^{P2#^d*}>D_5bmU@5hB;x%uf)PPUiDWn6-Txi@b-iDzCKI?8_3 z^xh3bl}PA8WilMBP;JW(5_@W|i6++|z&Hp_tSS zZ5(e$=lE>X-R7wafL9A#;j+y**zd4(NAKY2pPMII9m?MooY!)m->4@p(5|!UcSE(@ zG(P%I)%sx0ZmxDiJMgnQ_h@g+^je`ZSLim;%=%z>mO~(nfeC-!$=;Gzz4T-ZUM+{| zhD+gwCbaIgOvfLyS5^IVcE+b}4B4YWsZj?H!O??rNwXzqV_y5H^79t$^+2ByJ>jN4 zwWm?IhMAPz*nErw(u+5Rmz)?7tOSc|R~JfC;JA>YZ3=pvovnCa%gLIruOGuIZ%PhJ zSM3%ix8Rj_jR6cj^4s>ub!s+DmASRVJ)A!5V6b>0O( zF#~E4=dpjz;h51n4RrHFl}CuDN(;<~gOqo%c%sVS8m-n=Ls&f>LNk9h|LkC2a_6gK zW$irl1hrY}x%nSaWMTO$PRPjg=aNtSl;ziwPskJRkd7=`kVLv5xUl&Nc>O7y%o~8H zouWaZqY7sQ#=uA z?rTLyy_{TPB)YfvYPXU8EkqB&&!etP-EhT<`bb4Gv^vfhlzDnBFaNNt!ou=b zQp^9?8Gwc5uM`Jn`adjEnWQhg``2ouCn%nM3P1j=SN#{>eJKt(2}$f^ZW6t{_*OSM z?ZIOTxb*-SKZ~Zs#tga+Z~D<4S#=&|I(ctK8+fu@)0~MJ0PIE9xvqhk02y9k!U%3R zLA&kK+?yd%h-l>9cg+vhhOv9sOxW{1$LV{(JeZvpsg(vb=wp5OuSU}iGt?5qCVtV1 zWy&7WJcX=$G_-XK>Py0@E5u8;7f}XL;)>YlA{IJyT+f3HQ7a9Sj zP(((=^4Fr4M%Wf!C}n1~Qzi{Rl9`X8={{ZO$>(*OCD4)gd^l6|Spi zWG?BmLBUZHGsO$0h_LR}H8~GCdjZ-YW2OZ^M7cikrM?6&?X^61z^lo8SF~Hd2CYap zCyA-ykNiXtQy2B=d}VQUx(8xH?X0yg#YVnfS;g8UvS#_T_IjH=&jtR|6^&+aJkQNs@{UrvKuf*@S5Pj)o%=(*x#?}%$ zIdE#1#x}2JQ>Bq1J_&~(8XZwx^BvH3$?st`$o?@e8dR6jU*ln+yd^AmOOM!)u2=zX z*_ayMu31JQtQ-oDKk`#JmL#Ig2S6nOb-f{rbY&K9GB7VjLaeffwgVL>Jqq_g;2`lP z)P>Tk3ztVA9BbMf=e3`D@hFDLw7vSl%WXu~XD_}`>4e1}o9PmsUH3#V(3wI1+`Gsz zr=rV&+K|nUsF8aB*L;-*XBo;!i+JFMrG#C$mt~g&-V|hUo}PL#2<7%>qvGyH9knIW zZqse3Zf1<(JEQllZl!b{!;Ll3_Q7&s`@8M$l)(;?|484LV)QrT10&NP+W6Pn;J@}) zgm1iua2JGv50c;@C?qY%!dMlyya7U+qLhI(4}yMo^A{?Q0}h%WSA`yZzux4)3eX$7 zz$J=a#^@iaDMkRxt~3h6j9$7c7_TxzL6@`dp+PvAj>&}t?CnYH5MI}JWA^Q38>ah$ z;w*hPu3r*QRuDbxMgI$m(@A}P+?JVsL9vh77Zf+kP5SM7K|#38g?V9J!O#j=5Fe2m z7nT!;H>W`7c-)P z=^ujiSH$gqED$p@{gsNy^#8E;m0?+L+rD&ncX#vBAT8Y`-7VeS-Hjk2-7Q_x4bt79 zbV{RmU)J8|p6$~6Tt2Sz-23r5Uzz@a(AII&CkNsa$sQSY5q)rQ z49gWxo``#2icw-P#~0%}Wdw%hv11Q^_uQLx*SHT`Ap;oJvEpy*6;lfu5*_n8>Lsb( zt7Fhm72=9V_7JRQcAO4RNB2yjVJ72$J%+~!@|TBdP_IjDLXHrKrpFLtZMk9C^>piJ z>b!sd%B*uJXa$ad@R*-)Zy@+%TmnL+Wwe!N)???Mw1syxB>4ZJ7hw=U9}H^_h{CwL{_9?`ETSAiTKtPBTGm0kL_uxpwo5Ebyw z7&1?S7D+MBFZm1Fj)*!-tZO7rnL}$)juN17=WY=hQEWvU| zFT;VjbMJaDGUTz9dI(>9L%(6eUZKD_Qi+C*xdg0OJn${%rQ~>RbeDIZNcOg-HC+_y zZeVgqbQ824-}9s%dwF~2AQWE0f|uT_dtYF8@zuH)VZ2-i0J(1{aV_9` zHmr8r2okIr>zDBbMbaOLO0B&XO=MxvWi!K_+-oE`_Pi1-Lgs*r-a$Vla&F3i619_j zto~_^Tnb^UZIJp{2Q1=GQ{LhkZzsLiKO#KYS=52>ZNhujKuC1j;fz>u`t^LtlvTfi zY+3~Vwc}RyyX7ZP1(2w_I3zV>=31@9g<8 zeqh{;)Y$wOtV2F9l`+HeR3;CV?ZoXb7CoS4z%7|F)(Eqjzh%+IAa&<6Xd<0@l*XqQ zhvC8EJ!f;5)2n{1Xw?$m*i1e38ST}KcE6NSwPsXyh8uIJTQq`Q|8jf(i*Jw8@ksx*nV-RItzJer*hZQp%y+V0uxpHb#DZAk=qq}}5ikzFX~nv=O4!~;?0A#0CC1yXY}2Td?2wefI304JTE()}C*f3DQ3 zolIZL$9(ck@X5G7CRXbjJ}a(G!dyFHV;0xIHT4fqlZSpfK1vAr52*q6uJTE@ z3Mcs_-`z)CRQL;8Cy**kTl{!aea9m=)Y7xQ-82ooMIP`a4!BfVLjF z^+#7}45>*LSMYt0CdDHX2X&AQBMJv&XnMW3Q5-bZ%(XE$uf)B?p!KN`ebjRdm?!5; zt?S$9IG5e948hDQ^fkN{NtaO6(sHOE>WSXU%cziau2agte{BvQomF0PmMI)&Q`67s zkoek0$CHY15e?n1bbkgprWqA$= zkekh&r9Y@X_Iw0qTzZ{^!j92ep>S*k2pHggiy%#_S}q($izWUFq5N=M+qtjkCulQ< zU=~q)uRUM@JTGE6?V|8}cd=G2(6Bk10=HWeGgChjCn%k1|GFs9py-o{$=6mrEV!>` zTEW%$bu(5N#-3e|pnf0h1D<|tg4T|3Dbre;NISSo($FwUSz8!Jpfb*p8`aCf!23p@ zZqoLFt9Dh!i(C!6YaRG2mK@w0tbatgC*O*`@o!qKzOeHKub--u{KM|Q>=pZ~=1)vf z*tSmyrfm=NNr=M0!2h;h>pK4FXDjzqWATNC0e*S7Pz~nHeE0OmOM{6sC=f+JRCO+4R(>I=^5eeBuQj)9|ZX$SAJMV zTEUug&1!V7_T{l>EZMTVibX+UqD_d`A7H{oC0ugw&lU;Sq{qGL&>O@js+C0jeNA4- zhW-^>R#O&s1oA4M(H=^o4(xl>_!pl_(;S+d4H#nWGQYcaN z@^}hqY)@?N)xdDMNkq)=@8^W)4>6pgU+J#l=XI}c6gbjI)2esrE@?^^=Cy+7jgqfy zBb8%`s>+n|lrp-?GHQ~`Mdb)~YKkH>Pb{xBhd-6^BH8b_OS?wq_R#{Q9qSav;i)4l z<$?u41a+SNu-81h0U!HnYyJDezKnqQ&#gRP#`R`n|9fxyzbI7xxIYp1q>7XJM}Z6~ zsiY$OY@(q$1{5j3Q2PupIMwUtp^q2{4CA0Njmn+(qIe0eE(G5y~sST=1p z+NiP6XXunc+h4}!+_AfhxyL;2o0tb)=O`n;^H&I5c!2KR5xet$P#2qv zfoNJp?-lE2R581ToB7x)4I6kgOR<|e1m1+iLkM70=XT*$q#|Cw^a$ zVwIqk-vW!3^F_TGz^{d;uHt{{7aEhUNHtUQ3R1oIMO_|2apswn5n-O+fAI3krO*a% z_}Gpa1UdEw_Cda{X)hW1>*0TKsQdU1h7f7FrX8fvv|05aHQzousadzk-`Lo5bOg=c zPtgs|H(*?83F!>S?;BhPC%AQ|JmcKS@hWnx1(-=inUJA^JabP+Bx(TlQlrxBg5gr) z*SL!o?qIUHd)}COIBIGNPeUjZ(^NIZd6)jl62Fe#vVG5c##gLPMrOGD!5`3>CW3F< zg3sW4!mRsU`W}OcU56jH6ZQG4Hw49|9bCNHSr+sNXqZk?RVUU}hU%A+nZ8a#*^Ro* zi>bZ()buXs@egbHqUROsudNXNcs`&67(vu6O9UIn0I15^lTvb)Jo}Vdm&7y`M4Rwh zgqmxjdoV4?ixX?-U3?3s&#*B@vg251anUy^_zqF49tmV~_%-`Pj*XIaP^hMKjSp~2 z3&K$P`1B8X#eI39q&wLWqk4g|EmDYfc@<9A?MK;Hq$~-QjRQ1k?m$gdg%zCV+-H!9Z-uu1@N2*5?ZW!2@=z{D z_*wi8Bov7W_}7D?Z}O{_>plFm+L=u8GYAB&#r(k@J|On2r4d5p8N(_|^xDQNAowElH~eif?zd7Sx%ZM%qQVfz|nx z)|T+l!tg40=;$q}rD=Y_$s3oDmkO+HfA~#a)(m0!B}*~JkH!GC9HM7cB8U+2C2=R7 zbvR>&O+Sy69prsMC=<*WFfpxL>O{zt$G!|gwZDG~Rba1o#GJ6gb&P{fkZDh@A=O}d z*GmHyvt^_fTnC;TwcVZ5i`2s)+-Z-j&c8pQnh?wbyFYGEe#-c%7dx&XjQg-aVjG0e zvx?QrWzS=dmZPOq!yaM=Lfr1PRa%Uq=eMGhYmxd}VN;?ngFF#P+{Ap1izX8gtA|8m z=K8ymJUdKR!i_n)d)jCGojYt#puTPrUB55J%ewUc*ei#X^FLS&|Mq2P{STH20Pq~P z|Mka&_1WS5Z>|oUFM1rY{@Sf`$deet-Dj7a_>3zm}x@zz+rzl|^qed$55YjKYnqHn(;A zWF-~f%0GOQ)ZnJND3m@v85(4@B}Qt#t&WF3#zw!(h*@YPV`MJoJYp|4rrbbT(1{VJ zNZtVX0Ge^#<3cgbo97a0K9Ilm6FSa&mr>9bf;j3A-}|C|8pkix1vX9&brwYyR`p2^ zPJkKA|S0r$9{?c2E70f246%CT?GiE52BBO2XPrg{=KLIu)Ju0 z0c`C5$qUx~8x93`A|9NWE`;?X*OItvUryXY)pm@`PTwVz);ZUmd#{av+3r#0%o^fJ zSPvP;uxD z@=(LAxJVl(@mDn==RxqTFqlbb2=bQG<#2Xyg*PGjZm8}#PY3(HQ+D3?Ph#lmuUOdG zBTAFga*?B}Q3^X}ne2}VR=1$-6fj4oSsW&N3p7y=zkW>HSet3FZ+e{_@8?ln#FaN& zR*^S5ELPF`*cgbMKC*}1mumleb_B5e$AS7kGfn1QMENOgx7X?g(-3<$1czqbpG2a9?4_n-)^VRf7PB)o(f1QGIT+si}r>pD5e zLFLS5uapIxlS2*hUd*N#>efv;3NVg`mM!|+wVl`4uOdqK%2TSuEm63^ttiE?32*|b zF_|2yB1mMmanSzyQ7s{5aVum0`KM+yzPeA>)ZxSHvIgF$93dRis?N0tko1kIXY5!L zLWWHk%Nm&FzHI}#)2#4EfFTw)VhnC@8!3(uF}L%J!xGsnE!@C9tsx1dWYf^jgWD1U zZYbC1Q9K4atPqR%YHjgtoVo;tN%!4-(_Pn#h>rzt`1~2qlkHT3zPKbb^}!*}+d7Db zEbrom@+R>!h0M~3W)!a?b#poLScJsR6jLae5eqtAQt9#MeTUgMs6t(C?%sl7&%dHr z?VG#_r)ga1#?@wrF$fRjS*2-F8pBi0S&=5~pD)mV?YlwqV6Lr|VQ0Y#r5F~S`!UU8 zD6!v2xddw>l6Fe*>gxo|`T$!<5o;;J{O7TIn)M#_fk~C7xRK%3yPbwwi|> zrU|^tI>_6ff=Dx`)kpXVJ?*2vML65bBAku=mn^TA$Y%=|Lo$;HeUI96Kq-(s z-7upuC2TuC4A?g327KnROk}{52^vWO><3k=!I;WEv@m?%yzMR-$T|DmMCKjtaE@6?sM627sR6=F~z`pyHSLYg!Iwt zZDfy{t!8@hU8p~{#lX;FwIue>%BC#2Twhgqi7IFWiOFP;LbB4q3hhCmz_p=|@k zlN#rEee*#%`1}=+^|H>#mN)!Waa!YvS&}l)C zIi@U0O^dviljaS7i9UOme=&-!>Z}nD{{+H2|Pc)W1T{G96_IMVK~UI3a4&% z5qjD@3EfDX$CV#MfA4y<$Mo3b^h`Osgzp0+)%>;z>@T}r+1Y+cq(Fv$9r?f5e>vsR z_e*=j<)sXO+l^Qg^F-f_WFsLM;b)S>V!V~-yA-CB%lyjuL@R`(PtdKycYUanJC#qHMKt}n1)nm{HRjvUj2bBfaw!MiZp@l!HL*Ng0HMsJ$Tc?K&>51mOb_AX0Ts%(X4wAHK}i| zXrYrgi9T&ArtxxT$CM>%BvZc(SzfL(&g+;U8mM;X6bnagjT-z`$MoP7J4<2^KX)xJ zox!4LE~76-8k45-D>kwsUzZx~su2uwQYhiXr%Z~`R8o8}LeZs(QqI6>2HzkM7DIl- zq8fGTjcatR*@-d6kB$C-Lj%{{vIM8!n`s_V=v6!WhTa{GE-4VLsm`6d@M_1Yu6;xB zgqRkl(f1EK|DrOK9q{YUC&@gcvafFiAejw>lJ62GX7cvQfbvf^)nf{JLCM~;p=GTk zDxVP^i4o-#+57qY$3+RhunB4b&QPAoA6c)YA{XHiX~$)$I(=g3rslpJv81S|OS60T zQiAE@H%~Q^yk$DnotTm>%V`*vF@RG3*nqDn8WC{?E+rw_7|<%}kry$9I+lvqYFG$g zA9UELLl=RZx}k9rH-x;Jl)8y{tLz)Mx!OUSs>Yq%Kn3k13P;4u2tK}osnI+)^%dIo zy0S9z71!ALt*UxC-yl4#dwV^?s+_Q6gVtdWBW*XnZTDGsu|q2)7N_(d5BIT;tusB1xnJ>vq9$e-p`}2C2h~Zs# zal@=9_T8)g<=pK7nXw%mQHC9O+5A|@4iRT5=l5|AMg!SM$mTazibnjrOgEt_Vfy&K zq@m079a|on@IInmB5?X>sera`K`9pDd1Mb?q2Ke$&mO~Hvm#*;2Kmv?cAyqfYiGc~ zJz2oh_m3P9th?b3nfvldY5T?c(fjr+{I=h0JTGdw{bNf$c9s{tG6C$rVAa5uA<$_G zrTvKhCXFbNfVz(dM)(NrJQw-!2HeE*1n#X=#TQ`9u#P}^U)U&g3D@l1!no58@Yy7< z*MyVXG=U=TOBFM@WkAT6Y)}!)mFmY|*5wXp8pUw1);UW@0r^f|s!{;y8aLo}*L8=F zOK}9X=rd=teL~QK9J^13AuG+Y2y{Hb)SG*DJlRMqSZO{^+Oyksf`u{t8deFU?-f7O z_rL*47-)UhbU^x^0-sH6)xt((8aLt0?!B^VV#M3t!DwduDs*2uwyFu9v#&Zy3nynO z*RsjWU(vt3w-P=&_wC>8J=EG@HiB{y`+eWpUUbd@fL}CR|8nR8Qf(e0`HR9xsDp3F z5GeaMMKhF}h)HCu)D^4yv;^+X$V;gL2qDe8p@A|K^`3_%o$ z%O`i>4s@ZiEju=w79N85%iGNIT!a?nK4q2X60S}C$jck;vIlEv3a0IY(>v#;;PWta zy72zw&qiGCk5|n&@GLttxqu*SbI5$bw#KlWo3A(GqYgB z0`B-z$Y0ezDi%{w>dVhL4ciu{k0h-friJiu(C)m0yLXUqf6Uz!ExK$40}Zl8|9zPN zFRDiVvB!gr?Pbqoj$a^k;4}G|5C`(CubfnF@9REGp9%;6@$<+%H)HqpFq0j~&3Z04 zetQvV8X&xjnUe^C`4HwzoX8^=sTmG(IKlMTeNx?Baa;taacfp+sbrelqxUT)2mF^w zX~FQGfY-4FEOQ^SV@4-G-&yvOXWLWH6N1ycPY1DTUR}G_^J(}fb%nFOxt1K;Q?AI8 zjDf|l#gr*<#FWXysr18T<0g@-B2n6ma?{~RrM+M`8Rn<{PCjV7<|O`BN3 zw@ojxh{HuO(yQVVPdU#ri@3vlS^iLK2rJ!g$YDH#Xk`xv{}7ukp)Cn^D%hCg_#tDv z^V1FTa7fJWY6v#&|Je^?py1{u#5y*%U&27{+0)_KG$2w3gf{p)H&8>>l(z1t4b3~# z)RVs$%gUCPo`$8OKv>^51nm>U$zMv3{9xJpwCR$A47D1J><)7#s_A<4wLaql^xc{n zen&Fnq;wGUhg~ig2a_HOUFvMeA)&* z4E$^g%<_l*>}U-p-_1E4^Mjz(?ftcd%BGa!(eiXrw2C3<&kxEWAH)NT_gm;kCLy`h zRs)5r`&g#%zEVUfmnAy&6NC4%^Pj(MC>~8q=3C35VWW-mZ#72y0xa5jSQ8qikaVfh zZj??Qga{m0t>G*r7hrrf(dLMoF*{2{D( zUUoYFo`i*g29qcuXHU;oB~eSJmR|8fQn0&|HkQl82F{6a<22|_L!YXbYeI-Hvd?@T z#Fv~u6Slxy#&jI8_UsP!dhbMID*ci9>Q(6R7Sc>G9l|julHVD=IY|p|G|5m73QY1GV_BbdreERPsobvZ1`~V75 zX-oH85@zRk5vIfbD=f&bB4xYFg3$hm`Q0DX0rlN21y8kg0mQuWvRrgwR{Gw zhvft@vOc5B2DRyn{S@bjt261F!a4*Qpb1ZW_W32nku>Y>xf2f|R!MJ|HxsK|r#bjT zCej1vXvmKO0g(Jpnf*FjkMhBzN1(M4fB;#nmJ7b1;<-$+*Z3HZA-naWjRs1TST;=S z@7a=c7pEgomH5I82hun;EWh>JbWs>o7dsGqW*iyEHQV;oYwBGQ>(B%>nJnuKkbAUr zd_p=E>YmP}U|2sM<{=DyizH-uxkN1CwiI<^c+`rT>a!OJ_)2wGHFEA#o8m_ZxBZ;Pe>dTl03L^_!Xp)I( z&1-3#hqT1y=GB1f1IB_1)$Rysk=w;*2V~{?T*p`>AOh^Vtq7*L+6UHyuN_I(2xW*sYB^WW6Fm zuGS|LK5jy+VYe%HGKK1Vp9W-OrJL;axlEm?d6AuLue>w2J0d^qJoC^$Eb)t;25i65 z@&1cHvxn*3#Re4=a9c35)C;tIgqwDDV~(&6iZ}U|nM8Gvx5Y!-l*s3E(XA2FpX3{B z>f5~sxrD9=fRjhV^dFyPw2qokzy0Q}Bgf>ZqRDXVHjG~pxL4kYSB)0?Qyj?2{^H5i z*7%7 zmq&t%F$6R-C?YFHA%Syh}Z(Ea1+G*+IHs`zG z4Kpox87Yma;Q_N-xw(db;UZnI&DnsJA0Ex%Wy%c9p|AD$YCkA5BuCmDVUP9`XZ06t zGC*du)9|RTG%CNx&~yXy&~(b=OX3S1*?qi&yhu(i`ojjj=+ep~z?Je{X`PZSDbv~)3JA<&JOEA6BZpm>PJesy+(wb;`M?0tuIQ!2;WLcq*-ZJP62K3%4V3|9I|PsG?h#;V0?{?3LAsRphZQ3!Nj%WH zT|yX4A<~DV^>rYnr6$L3bX4TFX-4-Lzq_OXXqJl8RrU)M~(~TJqLPZrOT@Ja^gVa86>z!kqMQ)rQ-+b&` z5M08N{nJ9csLls){7rx&_bfmOxy>|6Js|6GI5Z22SEf#F-;X=I0l^vgi+~hj_b)}| zgE-sS_{?N$N4+?7&e{415;(##P25M__SgFkv!Mjiidv!CDSkY#5*8T1XR-a;aRXRm zpyjvg-lqCuR?5jmz$91oq!nAwY5A$q8so%|&0s1aVQ%OUQD;xoQ#Dx__R*WlNFTy^ zpIM-HToqF8*tMYyd1cQMY=mAKDl9!5QiUbAaQ@SEncNierM7#|h*f4qtXMxRA7(nS zLPGWD^do?y)9PJj^RTza$U4`%dP?1GB7LUyL7?{%k0V?;;yUwTg-jXHMm2EP?GM*7 z*Nd*@e{M?RdeNQ7&hjfhlqBQWD+GjBf_2v-%zG#~v8}zj5E8jQXrk5wF2z2{ z@SMTHN(qN2m-mo;_~l`ykD)+Uy=W3{ZOxLuWV>!0Z;$N(Ojh zmgZ>as~PpyL?W3@;R&47A2O3O^^Peo1@(Ya40|j{-)Tn8C`Bk`;$UBni~-&{@u$$_ zM`l>4#oiz$by__lF5=Wyec`}U57ad+c4p`0lF)7kJ)I;k#0t~7fY<>1MUfix8Mh9~nt$Hh`*bJxw|EVNmD7I>r8 zsCpUy4ui@GOM7tygS&gJ6~{h^7LxgOY-PBUj*zCEy^Eg(2TA**zu~Ui!p7WAw&1%9 zkMCeVkE^eK&vRTaI^Jx5)4C^(It-8?1fQu2gJ%m%zEX{2ODD*Ds$LSii}TrLs}Rx} zR+b*7yiJVTV)L@|uy{%=nEp0Z_+>+N1*RP=49*^w2q*A^iP~kZ9Et@XJk%#YxQ(hc z*P1)&1~t4qN3X<&Z~<`$p4X^%9kcosOP*h%Mz8PSPE^5tr8~()bzGv78iVa4BD=f2 zO$FsbUE*8KXtm8F*}%{Ft>(CxEQp)_-LK18DJxr)P08>{`bk-p)f2Gm#_+eY-lXb* zbU(7-&b)ly;;6^s$QoJe>v<9KqU()b z@1f>TLkX)}>;cirdM+chYUj_p*Tc4^BdQ1yt}Y_#1U)qkc=X70PLwNpB?B_;6WB<_ zura;Yui1UW_$Nb|yWMwIP2S_99rNF^HfLHIRXdI8#B4T0VO=Qj^>IJhiua-ZL=u?Q zGFFh=kuyowE039ZO*3|g86c;H6p}66THc&!qWG~RT#~81%Q06R?Dr8)a|wGW^y-s+ zb!eXsmAD*#qA=IxrP;BfUY@SlJ^HN+^Y}AAd#pB1pN2OhH=KsFw;n7$=pbLX1Uw~k zDV}`zhhvDc#5WRWQ&31}#klBLmJ_Ldm zT_=9YDwfuvSW>S+Rt!fzxQHKO(oBK~eW`)1QI3bL0B1aCVrp8fHR0^5sbIzGZJXUR%o2@{5 zKdriO?E1d+)ly}wW|~S8z_&D>*e$q;_}S*5+7DvgmgKih2J)g`(lPzV7BZ|aOPK7x zUUmOLh3W#CpK;{(;y#vW^gnu%`@V zO8&k5YF}#!&zn$0T7q~JTh?31{032}OqBKRLKt!|l(JsDM~Mxotw>d- zNH(d3-U%F^Zj;50HlHH}tz#VE<;kg+x@2Uh?>w7%ZhE)#(CNq*GxRy-DL9TEJ`$lO z*|D|I48+>d6!Du*BB=^#zfy%=;92>J+-i_LJNpc#EccRh2GyIHHkQ(~;xg;Zclw_w zG91W=6rl#3MPh3*e7j0@T;lFRg4&84!ZA(R_4eLdu<(f9^tf^fCBl;kO=s7P$g3sL zFU(hZ`v;7`7=aih&bEYYtK}L|5qI^?pu_ho@+#;;TVAwB4KGTqK4di%cp%k#*6uOD zX|X%r2t`Z8;QrLjJ?a_^UA$x6My!W1;6~zdkO_$isPy0tVethy1%Ww7nxo;>^Xd$*=n7_xyph z-=mxRg^lOGnV$T2tnzTMSy9q2+~Sw(GO5@>e9(*0BhLy$1+6iec`S9^#6j!9Soww!^8#)id~)y-Ilr6&7_3 zP89O*zVlv#LaV;$-2g7F2<3YyhS-CmHY8?G@pwo+7tVVo+hQQsRG<+!oyX_tm%cNo zOB)B+@Y6R}Bb@PfX1U9plpl^pRsPj?=08mP@4oZh-Cy9}11RjcEz@tS1YrH2-CqH) zzNo+QHz)LGYbT&lJj7XNp1>q(VBlr;dfMW%wNv1gyut_Bh7y0}vWC1o+SuGk9zLp_ zut?{DZZmgkSIi1P1hCL`u~NTh9J|yXdgZ`=YsMKih32W2N$H^Nl7%c=9;eiN>cru& z5HoEea~wdb(ZmVomOn3e=o52BNEBiv-Ugl867pH@qcQzT3RxGw=mdsHYIO+q8y9dL+B_RaPy^61irX zc430I86-i{A$NuB(Um9Qy=|3fk4p$fzOQ^{z6siIjBXuy6r-Vbj1a$5u~GcP{=ev= z2Xgm+rDXqlN^JsK>qOW_`Uo!1$~mobp+ok(K6EPSwZ4nhfw-So zzrrzeHo?XIR40sM??^Ghp<%vVHDYT<7%cmj9Yw4-b23;w@vttLoxOXbZ&!Z2opl1C zoc&$v)w3PN1~<7_$?F;ae%3YTxh=KNFm(pS6I2`hC&_7_`u4C;4)Z>LvWaeLhOmj} zkfTvmS9AD2PG9)n| zWdRwK?oSZ;%ZTf29KUw)5~Uo02919`ne9{3*faNvmHiAi{4$_;h&XT11F`D+8s3x@ zh_6hF&%`|B5HlT0XOQ_~aO9}vc7)5nUimIzM_9tdY^}(PPQ;DYvVdI$VWps@-10-H z0d7m-0GOkwiIx0n6(g!9rtqflAn1lO=A z`Yf2&5!p};1I*EfKd|8D47n?fZ;TDgGii515^6SDG{Z?b*?lqMSS-L;16qDE zURa#dK$u39$5dVR%v~lw^u%6l4qG$V+dQU{~Xx$6>`h+x(@gPqZvWXx#7mk%KL7I0KEnpJZMbPGc_ zEe`oDnAu)Nl;QXl0@nSvslyS*U#7hU-$N;L-O5=(MhoiV16Ccuv>lrm2;>RFM~9C?xPwVR9Ujit#?3qL zI4g`su)h0KZ^EmpR9(f2IFj(vQv}s2O4rq;wuy;!tR`Tfb9`|mK)*|V9iZ-Np294U zSiLDqeQzKUykS!V^utt1d96#u&D7}Gq!gSU4PWyn%oOgYhUz#s#XjIM%C6VG$hsTZ z9jx;`U-BvyoP%h6b&uDM4nZLDm`&VIXw3!mbI`p|ttaGHpa~!L6;F1M_iJ{l z8*se2*wEbvPLIDU9tfN)kDLq|lk*d{Rcyn>3E@-V9ZRq_1)djXd1*fqN+!}5z)miS zofLj$qAN-$U^!Omv^XOU>5ysWi(3t~W#?YN$7-6&Ra$v{Y&iAQMI;J6Zp4~Q+rI<3 z<9_Te9VHsr5V(W95h}s|6*+k4oiLq2Zy^f{ZjSree%=Y`O}cF7u_|#IWNgM0`Hm-pz|lwq#B8zXLfn<~Y}77xZ+`SYLs>+d|HkNct7+yN}b1ALtnqx}2d*7)qlNs1 zKB=Ygd~okLKEt^x?cGGIh^aCfcl&#f^=xetl?d70L0)UjN zC`DCpZa4=ZahWRrJ#%bXi)X?F$Lq3-0tHP)D5*gerE=K*%+NP_)Xod@$hONWZ?E5^ zN%SyfmViopDE`inOf|5U7!7{3YvL4SCebz4amL(byA`zh>Gnyrvq})+M?L0m*#Yn} zUi?4yxdV8a@`H`@m&X0G90=%QDfWzD#M80&dQ8uyggid2Jb_Vn%2x*i)G&?sMY$UvIZ;ZQc- zdAEVK*Z#bWF9rV~znh^fxPGpxq8z}l{u3aMIOH+s=ey@gRNed5ei}iv5tOejp58iL zQs)N(MC75sTX}&^V@}7Q2(S2ji!1%4JBae3hM_P`vF!bi_c#u{HBbaLt1MGXl#4Z1 za|CH4u`&iQEjw_WkoZ-7c#gevm#;2$&q5YzSZ)bTuV){WA6Km+=fy8( zHiOGjaf}+4Ch^Fs?mvl+=)?=W?O%e{VQ~|u$Yqjhtr~%9^OnZ>hWve-&JB)Jr!vOw zUG>iG9rXED$=Yw>#`Z#f`QMDV|Jy-c$n15bU>3C!r2;Z?@U)z7Y?VXL0<0*yJ*j;d2bMuhr$H6uKI4+?4l~;X;4?Xvkxjo7 zdD?%h87^U4qWb$j{;`74}Aw8jHwKjvO~aH^;i;3&9D4e_BNLA zj}bAmSGPR6c4FnrvO2pisJf;? zG%4Cg8Sh4(wom`L*-foxK`0JMtPQ!=-Kr~Rj6(BPExfziIT-P)5DZ`T-kxwMB7%6Q zz{K=dY1cRPErCXS1<~f3gv&&c=ieknWg-t|;QwjLe zoP6ep-#SwTu?E?~+*!jtk?t6jINCx(hNq6U{wbD5yp~0HE?^vav0bXhlK9XAvkz0p zTQtl#%{<&`6^n8rq=6r__=cb0G{5IFyLhM)*n|MdIQ-nK$v{uCCVF6wPZfWCi-GaC zSMEyWO7O3Ab=cnb42F4~P@=QxQm#~ll==*wfyr0Ly7-A!LUl0)R`M+^b)LI>Ecb{UlR>!<7%X&5S3s2heH{Rujzdl8iLow1CI*Yy*$L_I3tO=?apb+P)v#%_35lJ$zk zVFtII)HkjR4zFhifcO7lR7asRU|x|+Y! zD!9e~&TW#qC5UJCPM#3>KXpv+Os&3UqPuYwjUi@u_M%`VpK@`nwB!oXuPQens?_+U zMGa@-o9&=r^+lJ+=)y2#%YB2THaW3V==@}U4@ue@FaP_wd09v7pBoU|FXHq6rr46Q zr2yK0Eznrnp?*Yb*)ii{6!tRb%zEu|LC?a@FqpyYE^Lcbm}ey| zU>7n_LduXBp{A%0vaMm!6f%exHp+8Y00jK+f|7X)zaI2aB#q;nCIY;pIL%5S%ml~c zh!Yl+oN-%YB7-sAV;lU)L-hsI3tWt9M7pcXPbj$7lPcSD^YpqG`VjI_B}Hqnp#ah652ZDM zXFLbv8PD;31Zx1g<^b^=WU~ah$5kMnv+;L4=K|u7c#gzhcn;J2Z8P>|3}anBs;j=- zvy#KU7Z%veJ;Y-`Iw-;>)VmHQfp@jAxzyD`j<}cct^(asy}D@nMaeOHtp!i<_<1GV zmt_Okrs6H$-MP=DT{>Y`@u>46{K!&FW%^y2RPYq$Ob`P&WL-}XJi!+Kw`JmBec{FU ze{ALfxz@vVlTi>OOaTO~+V5|mak2{j)XcMzU<&j$w)2c;;jN2~(qAG$;O0TQhOJ<8 zP&eiJh$KSQypbC2B$1CT4LWqY%ap*y-L4_HnH2BVI2238?XCAv@W>HtmzhAOnrGRy zoo4Gfw^d{gM7@m7fvA_OEYRlL7#^lL?`VT_KwBq}bLc%422k&!XtM(Iyh;&3{aU$ie!ud+~3$ zcLE=fQivex^+5!i#Q->C+dPP*fA`5|NYk400A|sf?0LWs+6sVAO}^QABn(L=DcxoF zk(OMy%HigL`hE+q^pR3V#;j7iDma=FcH5d`cx*3iFdXFL_&GCNPR|E!3@_2yq+9pF z=7ELq8Gs8HKuq-1hXRdCpUyBklq_z`U`zus=`q3b%Qj?uHu*Z;Hwdc=?yXo+?fJzLDUmg>(KfntTIjsupS%^|>quVK*S&b}mp0#K}w0Te4Z1H}q! zyb_sOcWW9MK;ygKjzi7)za{RJB{|2J&xvwvRt3>%9+!^WPHzys6? z6|6EfX#Oi~JX(nL+zm(lVc^RS@8U~8T=wrIqyC>sM*m+)1{pEU_SNsl2k<}q`21x< z^nab-!}{xJVaC`|#Ao{3GeIg9M*zQ(Na78W!%y|IK;|*@UJw*itN}%V*%X^V!(n}t zBJ6b&$F^q`lmPK8&C0jN0%IG zT5BwS5Pax3^0`tFY~2Sv{y_Elx20!&nf3eMshf&&R=}~p9ee6y4qh60bvBwP-3@R= z55hKnLbBpqib*It-F_RaOxpXTTOH{hY;l9-H-#L$AV1IFxZ)U0ihE?9Y*PXSjhqbQ zLYBC;3{Q?|z^T9gW^QU`gP$uLPIOn>(>yabFWmlOZf><5hPy>M0f%A0#@FP5gn-+4 zVxG#$!n_)Zt<390I!a*oL)R}C9U@b3<+%!=O+!AO+ zmfFae_BNX|5eBZX`)-r5a z)HwF+&wS&mOJu(X!=Dz>kVy0OPov#b9WN=_xVnH{KOTrJPl1`7_X4-eJAh4 zOTLoeX!j}VBg8frY86`keZ;{*dB7hQJ3nrM=3m?`X5(nJA4I#b3dWRf3v6Xj~4#7z#~{c*CG&F;S3bdiI5SzgNrEDC9td&+)B(*oPl_Q19k>SA?s=lT&Sr=C2zipt za7?F>xs-r{*B`d*W}aM84x;1mS(f0tShe}Y>UnNnC&ZseTI)m1=R?}&L$uG|^6Vh! zG*jBT_EtVw2nKi|aq;jusN~3M8Ae`knYgrntRi)*g#XMVF3Z~oRmX&o@-d8A7HKnh zD|GQ&+uV?T{pt;}8{LgZFCBcqAar@^W-OH~bX!spc>Mm9YJ51OlsKrsHf7WMWa%TQ`aWOM(%2r

rX ziv+k8Ntd!H04F=3$At}g`p&7(7X}`NTExx!^K7yt^E96}ii=rF6g7kmx+J$we*6K- zITCUGhq!s!x%w4&kW2V4dy{^hF8{ty6FX#oxtoacIn<$C2_c3NkN+>`zA~%|wdtDf zlJ0KFO(WgiCEeZK(kYz+Qqlqv(%sz+f^J@t~y^Ew4Mjr*At71`z6ot1l@Q37*m-nvjx#6N=;8)c&DZFk(0j5

;0ot` zAWX;QUyjb~+81!ER#7hM{%rQ-wwl^oln2A1%fm!DJ{;ef$8DIhTEx4cIn(XM+HRrC zt8~h<*Iy(bK@hYHo%3@Rw-!Warfg;ucKy)7i#B;pT#Zsz&b10oAyaa;@A#IZp?~4^ zGB&{v$g&X8RjxT_?_VYSN0oQrEh9E(e^}4wl}U0vvQw&Y($PSU?FYITtg!CB+tH~H zYK%alAf#F}dC#Om5K#sei*W=T-! zdU3YJ*>hMsH=)|pNAMx=JHVBNywR3cz3PqgT6C(}KlkgF!qH?;=w(#t$I)=tZHX7h z2sFX(YCk%|KK8qj9lfwPzJR_TSAqV+T0E;po#iouq$-fP>Nj=H?>mitzhj~3yteXY zDd!u+=^$gg1d>^&lU!O}LNt0|RW9}Qc246i3feVZBX+7xRRmIcq#6#0sNO~=3U_D( z-?*y(O$YP^_NpdwGhwRFzma1;5kQsjZ1Z>Zr)DQ|Y1e=D>Nm~NZTPf@62wCS(pAiM z(s-+~du>PYq0h(Eu{Na?XOdFSQ$&tyS;{xs{tNf7<&caChFN+u%fZ8Xat0#tRNsD! z#8<1bRS4w6$KT=lPs__y8n>n8SWy?NPHKvqY|4c2`kgIn$=mvw3?^UHE7o=r(`PJb zR>6mGHHDU%Sur|eC7bb^m!W%Zrji< zzr}Zu5?S$2l6p(t){dhB}lH}A+gXry!2Jez~Mo$NkK<~WUKs1G9 z7se8T&gJ;hL|Z<=Xvr46VHPTM>w80z9l1Q5h$Fu*C_<|LQ(jw^=KJjES}xnDsRyNBorKur=(^+6^zc zyV#FW6{zoLd-pjl_u_3})CV#UyC$S2gF&J1s{;EdJ38QeK_n!n=IFU>%@ash`XHEiF$t{0B zsBCLS24Wh!tWB%io0+%i%{>-UUw(YRD3q3&_lLXntUwaL`pB6FiU2!y6F)Hc(ZMM~+WL9I@FGr-}LUFow0OH3`+0Pfc-{gik zjKW3Jca*~xM7K9yXWN}M-GYFFnGPc} z6yfLPl?$$JzG`7Q8^jDEAB=7}@z}fgFn6o!eFQ}kdAiq#I0vTQ#i?0fO3o^4m93+W zrn0VA-bmXU{)R=`oRD^?>ZPSnB&mH;CU1)BX6X-YUa`^i_OZCgFK5bV4d0!1w>00_ zZVYQ(GVyBf+D6*VdWxUEoseQ8!B}Cm`3zff;tRSN=-vBdHCdmB#r^XbK4J#@7Ap=f zgz^o-dpEH04&=3FQ-B6)mG{Y4^>|@8UWs9*S6$yGON#M6fR7{FnM8tm+9dW3jOvm) zbD9ee5>V53z2DM{?tFneatMIL$D7jX#0I&0yN`YgmR?;&!1v<%2*c9`YTjGjW)r9- zfGExi3fIX+{mp3dqrIJ>NcKXljmor(M(qT!lAwk&NN0O%QA{&90S&c<2^>`o9e@7E zAS~_=`K3?My4t)Vw2pDw$~$IIS$di=VoP8Fakhs~w>l zWK$NjIdKp*({aqdgtwP=vHHWpJ*zo@`Jdh3|HjY*u$Z#HN__XAgi(??`WhnTr;|r! zy&o4J0Ry2pe;6XH7=Wx(Jg?5x`bIUQvs!MRpX+{X=&JP77VZ2>FLPu&JEJ-08aK{j zy*j&g4r)EBCAa@2AV1Q!&@3JMHum827rT8Ca_B4Fskf@N?>;1vqU(ep$PE*c^M7nI zV^N_jqv=n}V2NX#)EDlhmb8xjJcJxj<|ekW9(UnVFf@~B!Q#BtzkcbQ8DxInv~jnM zcRKWLVLKmvcFejEIL+Q#ao0+0qNfQncWROVa35P%JiTpjK#+ z)csP?W1FEPgoaak=gnPu>W_{?fBNV)rHVE0`ZxU{G#Vs$1p?YcsR5_iZ*>k4om{+P zr`gcjZ2P`_bsHh$--3Qaq5Fq~Bj9=V{U3RNIKlXCVi?hf+Jihe5rNSuWt|p@uWw#u zPZ*nC(h=zi2#E-oBO)CjF(4G22^fHXXYpOk3fc_(^n=Y)bDC|04qcTLD_Wj3LH+{%*Y(*sezAohz51ex9I8Jui zQ-AAmqZHMgCO?PWtE_3KqD;wma*FHOLhp>OekH|+1Nl>lE=}nEaB`ky$yrz*S@H*` z2H1Z2J1jB}j{&{m!HN1^o)NtKUXp!4Sy@%z$iURlF~t$b1uB9PDKwk7Jvc0KbvaSjNGXXRvCF8jD64wa`$8SQy6n*Q+Ey%G)GSvj?^R4~ zF~p{*;FJmb@6vbvTK2V#Yq*;;O1*58xxAB`SHVlQ5JdG(g(p}?3(2eCmnTy{;k(3T z*>8Kly9n}+N|0&QI1lh!l;23X0J9=Saw-eVgjY`C{K}tnYJ4{gh8-2ISdK2 zM(BbTjOEi|Gs!+>MdZyJyLIcfLuB&Bq>-n)!~Cp3?SB?L0=;F~(VRNYO_+~@DI!#QXm>XY{{Z!^<<+Unlt~G~yV45~Je^$sjf>aOV zfVo^G*tM$(*;<38FPfIz%trFQ?3wN3h6-jnskU2Fv|E{cvT0ZnNImEJv3bh)nuqUqQE*%^fQ^0RIHE)Q9OFQ zcfXB<^}t(lm)4l@WdQw(ymWSGqn)}=OJ7gO90Fdx4lev9v|Hc@hHGEY(&}`mCkF^9 zK>M8LP@qP^-(wbDAYTfQxaRlut`NaF+2J9Gs_F+;UqKR@^e7wcPrV?aJ(^5mgjMw) zKweCZwdLDduDB(Y$$xb&v>R85AxFxtH-Z6JhnHvhiluW!j|2))NRYxpEp79`aPQuW z@32lZ6KOGvj9}VKK@4x3%e_@hi1J85yP~>*HUo;8TkX?eVtaczR`nUebhA!8U9vt( z?;;>I-_Ny?ad9xVbglok8p#Q^a4mIjII&2w>6*T`s8mplS5(&r?^orwk3JyrR}xPf zOMvZT&shxS$FHPl^nX(du>v$oUzLq`cJDud$(~OVbXF~GhrB(FZ89_p-$R+#+64!& zo-wPZ@=l3$+bBFONmCqOw(_u`ow@n2~!vRBZVnxR!2!JiK45m z6X%es8BLV@{nPzpduF=k5gj5MaL7Q^3j84pqS7fhNpU<-vQKh%??SSd$pZy1Y-hPx z+*g=22q!wh2yrACgCaxRwFJjX5P!j$J~~e&3gYtdN51g*5~+Lmfy>Lc4VoXQGroUX zfjCQ%@)jD}zf2;j)BX<5Q%+pG-S+c5c>d(KWy!bZ=j>FP1L$? zd5H*cF85=Ies&_h>6&CQ_`}SeWy=6ek8BxRtYkEhnNs+YOO(M+gc58g=f@AM<;$O^t@am8gJhOmBQDh-ij~Ik-+XyMnl_vamKNW4_0Rn!pKS=+2rQ0 z7%0$nM)bRe?5Wzz)~{?1T=7qD-L!JVD^5M)w4~`+IrL;5fyd_GI7PhgIc{1Uu5 z$wn@`C;qs@Cuc`Z_rPDIKSFPMT= z4Qi>lFKvh#S2T3|$vDI+?I>LswlKO1PCP+DTdSdoXR*Qh}10G#}Uf}f?dNAJ^h72cY)P`F;Y`syJUl;xNBU0LjjfSDoryPP`hCmIU zvNFqSXGX-#zZJ9nl)mLJK}UnYHjVL$R#L;z)AQpSA_v!UbM+b6q5DpXPS7Tyhg>qCzXb>QUf@{!5@yBN>v$BOX#?j2J@@sUgUxnHfaM`vuvCnq^1>uHz zQT%ief0woT|Euu)VRhfcJE_^1c@6RTpzff90<@XVxH(2Qer__onYC0ufQeGpK z`%>Bb&F7cb6*VCwpTzDLrO#RbP|8B4E)z=e5}p&@LK%)&!4op zfV4CJJK|BC{b0oeTZfOs+JcZ!RQO(l%deY>%PW_$lyQQ;(_7c?X%2nTo0 znokG-Au8S{T;i`3%q+=!xzA+2IV@~2Og-|7p{jY=G2TM2wnKZ=Uz9&KvSeOx?9E^v zBUjz9@9u3Z%H`Sg;Eej>h1fSz`r;BclbVY`aLxX7U&2|Mr`a*UGfBbO9?gRdm>mNe zV~7Xs4Q$x^_6)OJ>IW#+8QhK~5ka^{)>JA*!oxJkSTC1BZ_(QJ+A1fZ{k_>m^?t_p z+9;^EAoc0)YlKAb>Ck5VcJN)U=ke6g*|j9f4z?TEML#?M8Vmk)d-XL+_yO;&ObsH@ ze-6~ciJ6N{*7#|YPbt-E72)71;!rccFwPlHP8$!||; zjn8SFh=33ffVj&)*RgwUPSB67f@Wl(pYQ>;y>9@-bumb9ju5?(u3N3Cg8PRE-rMds z225%^7OPg-A(d&%;-tHq-bfcDe2#keFO+^Q{{ro9GhBOmlGvYB#sI8TdE^&Hb0C2W zB7l3f2oY%rICOc9a@KR+x3O`|CyDu^8#!anZpN?SFHf{2GNJs6Ey?A}YM?ahNRVTTg<+cH_5>B?&Thz{g@2iSCT@HalV z9N1ov#?bX+AUJpqJ3mTm2>kom8_at-XD{vxjS6<*owhuuWc3Qj*q>?)1Cg?4opP>6 zK`mRXU={F`3qQpD8Wf<`Jo56gcRg7*c2v9Pz0E?B?WqjHr1|37>lV3`j5gyRcc)@? z^$90ID_tbBNZiht+3ynK2~}MA7e{UdvuL6ZMD%<7n+$FZXA-k%B!6TyD{s4nP6$&4 z@(|CnwF*XqyHz(JErJQ&`8A{r?vzAfbCg1WM;sloF{$M zzlH5cu>?qif*c7;N~Dk5E|v^Pv8S*vqrC?^E1X4}@;if?2(c4fuaf%VYK`5wt#sMWH+0|i_ zFJ$11gtuQhakTz0wrAa=e>jDIm%hYi`cZQ*U|12l@axmd*A3ms=%n!g7R~NZQ}ftN zVU+6*{khyWk{u!00(RAHxvx10X%V*^tR(zc!}-bR*H8nq zqwUclX2i`es1YNFU-lF)RCNcl`X!ghaK0i*ozE3`875&BPdUYfJ6zH!8a2HS21nIx zOMNLaQ9}G~Ew}vhIsqbQQXcb7xEhwn@>aPyWWTD0Ok9pbQ{1^WJs{>XSdF(0UV#(vqf%SEX0IIz2odzr0a zdULhwBx2kuSQ<^GqqJlv4sA?_3`DZ0!K8nNu;UU#qO-*Qnn|2f;K9q0SHygUyXTz{ zbsCzqPMLJo)lXTVg2wA$?JWPce@_voz3j$cw8CTD5>5tLC07)$Miz=z*r&Vvon<%W z%=yHZ0cFMNMarZK)|FNdlr!$ZONmI`^E~7PD&D6ZIRMsY9Z=@SD$Sw~G0#I9i7%MZ z&zOZh>nty#kr>z`YOkQq(>}}tml3QQqzqXvk-iiY?`luG@{`0I7TMcF*~atKm=lOF$mS5PmaGn7sq-1vQH>qLf6G?g-h$UyI8P}zk7lK3iI=b*76hJ9@q-;av;t?dP)(f5p6dyJixZMpfeW@{9Q(tx9Tg z;>RT<`eqvCBW26?4zp%GNWbj7?{UuJ{5g;^Mhu8){xIHW9l6Kl3@m_ZmERtw+IS69 zEzs3uQD*|wsr*L}lc@ur3BHse6uz9|zk--SUy!?>{`%*Y^8fFmbb#kQ6OWxj*->d! zV2d8aIB(%DyhboFx6=b9Lh6kjIGJ44cbcr(;dT@;oDwF*Hr|&rmec?QqIh8i8H9wy znT3}sU^{-b5tBaO1sAO+ZWdM9i!zZ8VYheTd-t!T-<=oqkM>jgwCUkneY_{Zxldxy z!q@b&b3{63k$$-q^X^wJBbXrIX-zxenQHHkIdLDbhd>gTpoeHlpH%*C%xKDa0;nCK zz;R*%(R=zUy9;N;r=2nogOT!3@tll63!uuH%satT(J!O4=Fj*#%bX?Kz&uBR&nHgX zFcN>XO7Q!3ZqzkIkW&lN%RYZm+&fEoTrDOU9>M%laZN40JeRv66M@3_2!o!)1idq~ zSq#AfXIRtL~4D!|xin;g1 zBrlXNZ;AuN#JI&-H^>xpgM-8j`h#U&1(Gp?QW?#=1nFiOhZv=*t1o9GcArD^*>4>f zu~crUJ=wlNB5X{bCQUnh_*rjWDS2>HaMmlz=sAfsumbo4wEDcPE!X3jj7lQ469e~y zx9}$x(~B3OXP+$^D}Xbpl-!7bHc(O(`5dAk8te7>n{ky;xA03MLScH!fvSNJsQhbX zO0EDcL28}$aKtEwal`L?%X=^HqL9zN$zru6+!OjdU2K+TnMLM*wBE+PD*ycwt93w? zLu{LU+TjzWiNCAE`NryjA9XwZ=vjTVqxPLkV^bhG}*&1j1J0K@mN|`T=R=kWOPw zdkF3BeM2}VGA|cH34=B_yRTM5$oftF9lu07UBs8p(w*Dq7r$P$ZWmDT?t({XzuNu7 zWS?ckI3EQxENpC#Q3k-@P==6X;@>!fwK1%5TIvUYEW)q>Tx_aoL4g2eKaVkGe>6Tr zy$hFum*Zdc_MA+({!fSXOgV6lN2nohj3gWofCr`^JK3s4dWqjf_Pt=!YOJDFnr_gQ|K`Es-W!R=k6$ZUr3adpRT)BJoK+^U20iTEwMh zc6tah7WJ?juey602xE5Q2vAZbYTPukfUN^+2t0B>jsNT<66O^AgXA&$^H7Gzy=|hg zg1;Y>O;vRUMIrgSV_TSq^b!VawBYmGg|?#S1w7(%T~jHde&GfY{6=(0&VmD-`Zm zoVOQPUq2I_(H?)N)jOjVHGjI<&rH`nPIpm63!(z!&fjRghNyyr_n3^$p#jiuf^`p% zf(ZL0Eo(LhrMHjN!|p?Dg?R@ln5Ns}LWihjN7ER<&Oe2{(N16C5^IG!d=ND%C#0L> z&z&K46IS9%+okdA)U*O(Y-u!X*8$VGBFlS=j1jwt^w-mYKTo#?2xLBj17d%B0KYY= zWs+`x@JQxYNgTDwlF6y@2&RSftcdGGo)++P;WR#905f}W7atyF zB3QiR!vGJL30N3r7*j+zjcND2yU0jPQ4BTcoJ%CsNN0s&E}j%CbI+hhkF<)N3TF(L z6)!TQJ8Pk$dB}vAeWN3*u03utS1HL(iusrKJY$uqmyE~g7ULMAgQFr}hO0#(>&Lv5 z8@=n)Z$Ks8#g3lNoAsFo^^w)!jedm$%zi_9$#p=|z03LyU{^N0!DDK&7!C`)H68Da z9-S{h{>&T)p$9>lcn(<;7c1#hHV|pwB{&nlA2ec}tHC(m?n_n;T|rznZ_a~fF8OV{ z^CQzopjI)`kKvG+3=ck}sPt3}Jmvza-Q`9+K4NqZvKcPCK+aA~o5IMScG=6{sVW74 zt=CctN)0lq^$KQw^;jq82xyWRHR@Z+?{V#Zg3^cx96p`#Gkd4l9zi3rG0Z^M9s%49 z2>dYV4xIw^$Y<^WWF>CTTA~KU4T##c(k{Nk> zWt*A?=AAtu>zd=1o+1OIezB zbrx-A{gM~~*qNY2;Ar^J&uiPo1(tM_Pb=8a&CsFHK7yn$T-hdy0$bk$)qe58PQa>3 zrQnu_7rs_8*FpG1b;nM#3Ka#E8nk}D`0{mJI1_RiD}Kpmb+Pp$I+cwS&cviQC#bfY zmIsk5ur>2ZOF|s5N$T7IU(seJnaGfTvg(HVqKK{g{F-Z7Dr{LortB7ve7YRW&w3R( z9yuwzLmh~IObEggO@$|5ar;X721G%ec{h53iHOyD(O&-jsNjcIJvP=vJ2B zpa($qbQ-MBD?59f(GZQ5MeQO6GROgQoSa>4+dO;Dzdb(+3rwV})eZkZNZ5BUTIxNm zpBO`uNN&N9hdAA=#ZLP;W4-#e`B2fd!d78l)!7FW?Yz1aIiwk2>0o8}{);hmpC0ZI zS*iy46hPNcBBxQmUE=@p2vNz6F~K&js284|caxY^5_$qWs=D9En1hUQSg}uaR*php z&eAb}hvBw613iO=*MRGeN|iN9YE3sXv2S zo1OfPw{Gl%B=Yh(C|3)v$sfk}tf=uZcB(qs0K`s#K}sf#Mms9@Nu@k`KJiT*bAz!u zPirjSEG{bGMFDL9CHHI;32G-=X8Z9wOQLm#YLTIAHQl0x*1+(dfMj*CPhIx`ZOcf| z-|Rs>MG2pF=>u4wl^0}TdHndsH^c$8d?0+p{2^*1e*WyPR#!KZxN716FE;$O5jU276`e{ru;KZTUg^nxKB)vBMZ;ODN%u_=z|rvm9n*0rV| z8a1GWfm|X~%^tgy?eI9xr$~;u?Lh%>N81M-sYsA<(B4c{OxN)e?vR~b3So1JUyxgo zOi_4$MB3tuVjX*!D!ITa@DOI4#F&`)Ffk8YpdJQBjH?jGSp*Xpd(P~S2OB9G(|)ur zfeMCo`{1o;CRV^O8MPaHuv+DKI!$N|+uljtN$+#vTGzHn;s}v!ZV7F*UrWfj4sSIw z*n2Ucf- zFA-NLd=i;O!Ax=_!}{Puy)3!!yk#L=LODMQWlbiYF8u=4Zw;S+dRhR_GHn0A(b$>Q zANrD&$Jy9fRhihCl*ZWr%&Pyv(d;MiVbJmbq3{J%|HaYV9FX0g{(9Eu#j6~Dvq0_{ zKs|OOFyL!-nL&zGG<|!`CI7;Z`clt96Gb@_wXcdS<7KFQ_-^W;;VlXvE{|g&48mp|+-pGOttIAP;$_p%aK4u16#{gDqTfyD62xL=IM|Kol&BcaK17#f4dw}M%2C@@^LxRmKW+6e0=yTcb!5mExWEN z4kY|@UyZv?C5d`Ud6J(_nC)5X&HNa6V~deR>LGprtODRusfl+z7Fq4qn(k|j!arX9 z9B6k(EawT9mf2y5-nR`B+v2au8UJB1VIeTl(PLc|1Wu}8>Y)8AS}~B>ymv zXKvi1IuN#)21Ib6Q|Tq21BtNvgC!=AShVU5o|GId!FlYo0%bwjG#O=2YF^_W31V5E ze1eJSF=-4~2VdZHY9rI05-J(XfMZ&pghWg0otn;D$($SVua2_xzV>P5E{YghIST2! zoVRibI9M-;MLQ8SChnb`TGIxy`4IM|SS1m?#s`TS%_(V|qdmcI2&4I{Lh%BXKz#?M zM6y7ZZURQ%cZoPq?O0va@r9jQ>(K=ZHa?v-^Ydo?_YA#z#zXMXEdV3@5Il&1g~&T* z&CrTo{5tduphWbndTTRgxaLggLfJ%(%(xX3AHs3pzrFe5o%fWA6$Un}D&@Fb5e=j_ zDZm;h8e=I0wWtP_E`P``9uEU61cb1*ZMHOeGObBK)%EbzX+dP`IkaCk<XW;HKqv>7zBuT$#y_Ogl+C|{Iy}}WLxMK!&F1fUWBuGl5WLL$b0OfI)s|mls*w% zVBU7creK5ze%g=%lTCgHQ7pA@ST@|ZHjr=9{1uAl<(&Df+%TP?fFG3U4t>^=9pZ^K22 zsv7`+OIq)uMVV$FnHO~Dpf0VpQ#3$b2O2asN4+T+l8S~_g;X=CPPzHO!^pJ-wF-@M z`E*RI&q72W+dP(<&kwl^c9nk>$5exS2NFTNm5K6ytIc49#zOoayuf8dM%G^@7T1_k zf=I!i1OQKp2!IHO1yBXPjDiO_pvO3VIu`c7xqJTyI{UcXNOepa4tOpg##`ia;IYr^ zd!Gv5!b&(dqY#pWF`ghwy8wMFr<9|} zY#LX0yxa0c2rDAgsdbIBnV_*_0pga|lh-g{fg8=?%xfA3jbXO35!A?~vBdE}6|xtW zFou4OyMBR%1mq`lgH{A|MrKsjN%U!*Ig@5x``$+a$rvvf{`y>L1!kI#Rha}`6?fH_ zV2tw~Oq)y284o05grGSzjjf+2R#q_+dyBpV$fzViOkBq2u-rFq3&~XfQj3d6q#(L3 zPmtl6Irl9+TI$q6^AP&ARhG75l&5BbkuS$!NU&0i0VEsaYpZp)kNU%EJ?{znUzG>~ zx*E?Z^#DA^xPf%awm=?Mh-2>_Z-Mqw?Ujx86Tx5iY|EtIM4%-h<;G?ci%W{?2brsl zM<|^7W7s~m#;lC6ZDHdYVmhkSNoRI#PQ)iNfX87gQ|86NzhK!?#EJ|M1AV`qiU4Ld zuz(+~$JxlmveJ&wqiwUsq^YP;?Lcyx#uV++Ys!j!`7=}u1Qwx7uMpAZB(!VBnU zsd0!72;VSFPMY07mQ&e*|KUJ9%N_w9ce%>OOP2$4zoI+3ka!gksabPVg(ZQ`_fycd z>!$Je@4P?*VPAmyL!YArTfiBdh)4C6lKIYb;iv&=E!NH z#=?Fw;+MH7|0@Qk70TBQ$?M@X^}dTn#urNx(RJ7U6c2yF*XUhFz1|!B`T17hOK+G@ z(lMn@ARsD`lB)nRy}-4RG?-VB82MlNXcZYK;zvPlQm6DdEeNX+5Ojq^Oaug zY=v$&&}M^SPXlZ=z_VhYr<8~fG{Qm0o)NqSp~O@aiGEB$iGIj;IdVh-$+P9zy5Tk6 zCrj!|GGM$COlennuLqpY7Gr-)Tw#)(10}9D&DdcGkfOV7k%5$mB~|H)4-!`l%H5SY zD}PB`752kh%gws|B;SMvN?d_kw~pCN9^!X0M*k&oRVmNWvUgH04&*AcF#>XxRml#M zIp~0Ow(c&M0Vxp+vk|KbK!br~f74q^50r>n;pH6sX~EpQg_}cb_H+wB{-Q)=VfiN| z;u|n&Tg*Qk%I7&O|GQS|S*{}M<3cP|<-bJkj$i(4AH~K4_mzM3o{$}R_xRc1JGWL=#5Jgnj3~46(i> zlHU5KpR~{zEjMm+Y#=(kS(YiG6)SeF%{}V2)A)jwK>K6gDH7!3Fk=kBAyFW6+uXtR z)*1KK-^3r2X_)2I!+JMz$7umEp+Z(gpfub<3q+&d8=pPFjHF<9dd7rYmehVh`t_;! zYpWE{L9Q3x&W$5tx;r?zdU#O%iS69_uVz8~q8zsT$NHEZ4-W$igM1_yJ1lc;;!;*I zGDczWIvEu^tLDG~92KckbRtROBO+FI=4eP>IGisrF(iPbw&%sN0G3C2zXvbmZx_3d zf(DWV#sY!wJhagV*wp(9$PaFHwOaQnF9_W;cAV*q{=-(`MZOC=*gf&5S8tg#%wWvg zV#RhHK1Ux~GO6{Y)7E9G==1zVLdfAx2?261bA)dZJTmcnu>Ys->wG=!f7ZiYeKOP?ksqnBxwN zzk8$WLvbyrht6DSr}W+94WBe+wEUHiI}iF%azEO4#^afDp+wCj)kN-wFcxr3Bu0C6#Yj+14lX>?jNT#Weynt zXy)~OVRPUp(Zqu+#5TWIfi{O%*+rXk8;VNQxkyqkRMK-eb z&vy#oDelc7pj_+^0K@85j6tP2xanJKeU;6*|F!7djjnF~kao-;Hu_n%oaJ%hglxR5 zqc$@T^Z*JMyQ{7fz3(ed#M-#Ao1&*evomd_5QI zv=yfFpx3=bb4qNi zcrm9F9rptH!#F9r=1)#Gmom(2OjbjRd`0#U$XnpPS*sFLmo{HZW7s}(UpX4gD7yr; z^7A@ZnBT818VY~tU*vI6Yb{(4Ynvki*G)ftvYpIa&)UxaLwf9it+=xmC_P38&*l98 zWh<^-&L_hXY^~(r6~iWY-P`lY8U-o?Km7WE)A?gn`s)V=#!kAs;lsp(1LNhG(vOFq zSw?gs*#AJb3S=v;^_jfG?c^8*IxrKg`VKO{rXTw$mH@i>%IX0(hgX!_jHi{5K(f^z zc0jUKh6jyKG@wQ&V$ng(zoo}oS>aXr^EZvWxKh6PK8SR-M8AIbACb<>zeGBTAVdGa zR?Pf77X1I&55NLq2;jhG%WhqOqm5Luf{RRj&Pxl*xyxOtO7ir;p$0K?mEAC>*%l=*?;IhY@oj zAxgmaVNswljy7K_o?EvENpF1{Vj`Hv%Vd;qNM}`BhujjbTbukTI|7d99Lb)dSjuG5 z!~S{duquHE+V87}?GkAjr!wVh1zNU ze(QByCy|k?d_r0Eoc=~gzb|% z$nv~?2f*XvC!IK1V4L+{kjIoL1bH4gst}wcUFB|!lov<^v}G~&5GTCt*Gj?S>EJRu z)-$oOv5EXfHBGLtl|yPv=W!Z(dby2dxFAfg{MS|B#X(vh?IUxT=|~-T<&i?A+{lKU z{D5R63DqptqmI_6;i7hGxvGt!BXju$jjecRf#8fm|%{a|>A^VOo>&{z^-L&Ie4uca(uRE?OXuQ{r+LZ@qM8g3)^0Uib~zNebZ23 zAx|1KN+wzUD=EiyBL0|Kcyl|&wn$J^Rwu637i#@82zNx|MpOp=WGvm#y-AD?g_x?& zzQ#I-pA>DfQZIOzjxO~F;2BzzC9T6Ge)bD88lZEow;!|zeEgUnh3wo3BUu>ByNXnh ztSFJF9JT_!fOz-FwUkcaZG^5MVpi`w3bMKnu$W_k4s8|R@8U$b(r44YSOckA> zw8sUc4jvnIWMCMcD|PJVOB}k)xqSW*0FZ39XIn(pa6TUpQhp(r%4i z_t5D$3Rh&llw3XK1=H=eyMcyS2z^@g!ScL9$A4&u%f<^nbc6j)90^FlNUj1&NZYb6 zzs{PTw>9FlfW~ZS7?se{I!Wj`4I(AMUDYOAN$+f66-^GQ0^lkN^Nz*uXGp`zwmxgX z&n3l6jniAeCeZEj`4+Y;ssW_1SaXnFe7z*vF^7Zu6gT)0vc zq3`oRwZPjc({(iQ!3GD@mpM*ira$WlTA()=3oqNz3}meV@iAKC=gshe*3uY-Y5Gjx zxTX=HTI)2l+4MWi7%oIastXYlfBI(@5!KttOMi({wL8_vHtLsW2r2cb6YTATTCSMu z?Bz_8=$w3Oqh1M@`d+QWDr^WOB>GHjhk0P|KCB?ZvHG8Quq!rYk97p2 zr3}9#e>dHg`uQyuyqxd0XYJQyB(1Cv5)Qd~o+amowPIJ9%cw$uK7s=P4DD(-rW$j` zXVM6n_<`xy)gi_8Z_|)|GBGHuq?eAsoa0N5_J1n)Y;$nHNwrF?wNbyJar}Z2!8iD- z{bPg1F?QCx-mX&R2M9|^EB#N+sqt3tqWzU>Ym|>Z4Bn{kT8C_>6~S7rd9+$IySZrF zDIkA0zZb-^`}~ImeHOs>KkEtr^YPDd1pr)+@O4qe->sKRP7&H5;V9o<$$u<~^Z?$q z?czg2F{q4gSLZSc>DnQ>TOeELma=&IAcC7m)PCZ-)fpr|>H!dHmn-aIJhvhbv0V28 ze>V+05DSo$%eiBmuU+TOJ1xC@vbN#4epcG_;&^Oo0#@+cvhY|H1@F5ftNc|Xxl543 z@R~iYSL2wt%*}oU;z)zaMxF^FXlBoLM;InMtbSsMud2z!hV2Jb~}y7*Y*B|MTD}ofFJbvPg4fhL-w0@FIM(4gE-0*jEkU^alghnrovG+ zrZrhY)SuZRv0mHtxlXHkc11&RX3NoQmKKD>cUrJF#tC(V>r0jmechQUNF_z|8nzGbdN!0QGK9}9KEX(UU(-{wdV^A)hLE#WY~)f zap>hEvWYBky`{zqP^Zmk!x{EJSjKw!*p7T$uc8iW%vUhJD^wM)*Q|~2hTJFakdhax zW`fd@{dg6^H``k@!1Z1x(NiOyYdCCrb7^jd5Ye@1X0v*vs^yfMlM;)8P>=I+71LY4 z1bm_O1P1@Og-Njt-pAu=QV_fmMid2V*iViLFnA%NtLYc<3XH`#jMe&k_-Jk|7gaJ- zF0M@Z$%qv8BJ`K&VyB^Ar&3AZoY7mfTchrSX^!T!SMA6=k%WgUzMw4KCQo?@fL!U% zI--wLK&r8_KyMWoVgk8dE4ul&fzQDM3B{{s3C4lJtl@S97#6eymO~>kf>7E$t>jEk z-#dD?ocH1qr52%k6mHVjnrp;c7K>`KeJ2IEqyeC_qNo7Nc14iwY?#vQzR7;9Z@c*4 z{Pds}uu}*C-HYPb@7>D#u659`WTRrSOqqXm{SXsbppbJgRbdsC=kGIC*C2G+ZMM{0 zokr`*cnf-jHal%PAoljPpQ23Ga=|VD>x5LkNNBbF3IP(j)OBs6Gwl%Y6H?2uqJ>}K z5VJYQzy*emZ+ru@d2Q;vbqxQ&><&D^PN)3oF?(M78p~rAhsO+~KsH!OMQ5Nu*HTW> z{HPT2y8SuMckDnY*&N>dA|9G|zV7LYRtGgB1E0MpPgNEXz3A0dJ*`o*af~IKjN|ZT zQ;SYgsiR0|L77O9&~5NViAOzbmG1(UNuVj63FRiCL!rViOgP6qRt_5OY`6`Ud*+17 z+FMn9a}qPdjv&kZG?rtAigc!|f3#ti`@}eqFor^&Xe->2L6=X-e{d}ehaPpVCp72d zQ{!;<-gJ8Tkr9El8InULZmh|+9s;m~#ZWD5-{n$){l-AA3ewT=VkUUtTH}ac1mu;p zc(IN#qtYQ1rjl(tInRo(rA-v*BF<~8F$5#i&*SexLtWfu;&+|*L06+ip)P{1A%EJ$ z336#NM3`2s1r4wqzxbBb*ENpG1d0*DwwRY)n_UIFVbs|$;}IkPWV#`rKY**)Ny@S1 z=b`SuBUs*$swBGuc5OET-bepor=In6uy8)|LuHjDZM&Henr<+z1whJlR}yklg|F|e zB)!H*Y2K1cp_?eHDuy%6y^Y_ZH5yD|tK-heG6i4YOG$0ePO2HImN`m>r`Ense3?81 zT+DQ`r-HB`8q6^wy-m+1LT&HZ>Wzm_Als}T8*ARMy! zsYpcwN!EZ}iQ^2Aau%Q&DKgi9++Eu%5@R+@3&UD?Z+4JTi~hG zf7r)oKB12aoq#v)K?7FgGD8R}8}2TaQ@)^}%KoVBJ?1p|Xs>Tr!A$2iGZZ3fVW#D0 z9_o1CddU--mNX_;GuldO7xiVwsXXzn59tWsMRkT}g3tT1zON>)xBu+3|$7%)}bPTwaf8@d;lI{NA=dY@*4u4A11$omG?bsS3_vd+6E9~^f?*~ zqAr5RBoRGLvYN%CS zxZqxirtdk3kjhQ?FOg0G@K?+k!f(s(27l-tW(+0LY9A0fVDA|OC2@ucE5RTiAojo# z>0^E!jO*MNAT!y}(@p@GlU;EU8{T83ejEFN*xUJ<{15B*to{ff&%mSgQeWKw-{|~`3-n$wfJ@ed===aC;BScc`f`3yHh85_A9-*$O1V zz1;5{b8M}>lzsJM2AeSDc*FCD^P5EOQ;CU6j4Qb=OL(QnA~4^`{iXPaJ*b9hzAqp1 zBfaFKX|U$^;a%~yS^04qGyY{t@5Hm?OJv12{^_$o%m@+=OB-k59wmbRN8MYt)wwKf zySQ6$cPF^J26qV(Ab21IcXxLuSa1*S65J)YyE{RG%N}IT=Ut1L?00h<`^$X(!5Dpa zcU50ibzXh$pl&WU@jSv@tScLo!`d>rUo9G#jg?jfOpm zYPPAJgM~6@lYxUc?R1nTvA$dH8j{vI1cyb&5ALpDglP$A!0NU&5=3X8F<*b)4(KTUh8rJZ@X4LRwKJ{N={hgA_i$XhWp zeh;0(OCeB0>Ld=}Y&>r!Lpzxg26D9{V2p|wS=&i_w{&q{zw|c00EygIE!PpIQi$o9 zJ@^anlvH+Jz0z{{&!|;}Q*W+HRtt`K6x&YEmS)?U-P|7hOkE=`ufWmpO>F+KO<1}w(s-UEwL6pVy2F$Ub-7Q(;V5nR1q%Cm?~ zIQsvor2ppo*Rb~@CB4QBEc$-?u#+K)en=>FKGv0ITJA63Kl{@E_Wis6+xHJB-W=)o zReD*SkcsKpNXvh((h)v-OzRS4DB1eOeOC6J`8II;uG*{AJ#JZ&C&6ErGJ!_zDh_Vr;i1RJnqvXIkt4J zaPO@AWsYdX;kM+T9YE`Ap&1DK0&i#2y1T~(ons?bSTB46&hk4|jq?7>G$`r91Q z2Vjn91TaU`kk^`q0rX372U;-!%n=Jqsb+1b3k@R1r8oQV?FPG3l44J!{O;;VT<_!o z#Z;$zpodcP-(8AWSYDK1{CjVl7Yf?X!R!E@arpn3b(D4X=y1qIXjDF7E8j$$Q_*Pm z*R`SnptRIEpL3PtQQz=0DJSOA+-p_w>|hRDf@;A!*19uR<8&T)z2o=*7x$hU~>W_KqR7(a=uR8%f|k0D~Fy#n1s}vAR&d#cUw~senmCQl#*Ml4&$G zKY!mZt2r}wT$L#THQrT@563gl4hr36k^*;*Jg0Vhz%9cSIbRyX<3I1Lb0VYG>2qu1 zMX8_@!2{GoS>i7Qff9B8*t+Hwj|^5)7>floA3NG_N8pa~Wj3mn|GKc$0t&C!UIM z2CC3)%p^*ono%O+8A73#(4)V*{(c7LvrWL>D-t!QNpUQc}FF@PnTBI4*oms zcMw9V$)DacxqX8psA#B9D)8uo*ME#3D>|pXBdT4UovAZwz>y<4BqfI;m(Vkw%0@v| zHW)-mC$ysu3nwV*BHVNp49-&|x?7S#%lGW^#M{T(WV@qH(j|Obu}5)Ih#sfwqy)3; z&098D&8#NWry%nqecSe`Qm#U%yR#yOIFgCGONe;)E)Ugu(YL&^kqihDfgK6N`s#gx z-KVd1GUsl}20FM#zSZLDBkXzU5f`w%r5`DN+X##tFS;oI@6lxF;>l|_-Ve8dR^}G; zsaqJ!P!HkyQU#}G#HanNS#FtdK**a88ZI&30!wGo^E2Y*%)vmTO zNXQ7_wd-pmrjMin+Ix9G7sSrNQ_rxX(5q_SoA%3VxA>N|8{oBzOgUP!VmZj(oao5R z>|H!lU^9DZ!fp6ey?*0sGdW~|gM&*qs%9XJ0`pZF_Qu%^Jo@%2=FZV~2=T{n_$bN@ z9p(8^$1Lv8#Bs70tWU#iTFE&+W?<@N^xptqrv1S>iScE|C;!^h!pQL=*@WX+#=slO z39vjw0=;$f`;VP$RFTfih>#YnC0mbGhZTm1@vf*tzimF|m%)9Xt2rt|zlL)`TRn1rfQU<= zCD;=9I>z3+W_ry2~fsrY$!BKOJjkf41cp9t*=vgw6a(F+S=VY_ILxRgheV;prE zMm)^x=Wt~pcC+iH!^p|R|I<%Qew0gcCkS@k8FBra#PC_sZmO1tE0VSgl-GnlV$K$`2HX44%Z^ zp)*)hDJ}LfbpK%`W3yuwV+1dAOW=OFOfS_j=h9saLer_c=nGd@_Ib*&z9H?(aqY9y z^xd0zwM}RTqF9t*@*EB~3#^uifs{3McwS#Ou=S5l15L~tXV}g0S8X3E*smp4M1*#{{$e8XGTWHYw!t4-FL{_rqe>Y{mF!)>*>r$0!xUR?t zugsjtEWzNLgM-(kbv;VbVsURiRdap+{z#4g5jm}HxrDyFNBIwX zr)2GyQ>O@s4{!@b(Ih_4V~Z?>y-^iL(FEIKu8N2nhi^nxTSwTtb%Gqs;Q+&vkWB9g ze-h-Ri#4eAESfI{o9r^yUb#y%IN4K>+=J#JXZvis5o4QaP6`*{pB0BO>v|xWqBi*$ zVqk_&^c4GZN)nF<;PUZI(x5TLUkeEE6)0j1`%T-&RL$~hB5Ljl`V5#Esw6ml7)W)C z*7HhrTi57at4zMuUYw)r*f60szyKHMim{)DothjUoE)QX242CIrThJ0zmR{z^1MVA z&IsV20OsLZga~xHyJuD|Bm1(&AC}YVXvUz`kxdI>y2PtC!zDXxo1{gHdu|jUH0bpE zM~c@vY0Jo9%_+q=q|cOV9Vs=WLsyJH&{k!^2h&=ar^5CD@y5zp8cNN!J0ZUD;5c9r7v)>SS)Eu`mg6PT@w3 z;;J^Wz+XTY&48&MR-=}OSj`iPuox8$Wf5ffp^eBRwn$?yW50cr!djB19A_}(8wpJk z3#Rc_U+MjM`KSrZ3uVpdOGK==z{<8-_6K=eiuTTvLv^It z>bRPg5XYq=H(&p-v|1f<}Q5Z1m0#qqnU}%wAZ`7iia*bai6`n*Mk3%Rt2;^MTKptO z+I%QE((&$QoV#Z_(4KROE>O%T_8S?O#2!v8xj064sg3U(znX?cB6!Un38-qqxoM=d z?NV?KYIYk3QUy-X2A|z5E%@~E}XntP9+1FrEjpaLAm7RyBa6(H-&T4 z)CHZ>q3z{VL|yM<8QKN2>aoPflD@=gq9)S6p0SJz43JwEWdiDDd#eKM5wccCmB_0U zFV*p7(+(_A`y$pQrg(=6*2c$6d3zR@FN!9&g5ukm zVkCN_gS>ULX`tU2!dE+Rw{yw|PIq8=6o>WSKfuf22~5uiQ&r>zpG+Sb&tNl*Y}rH1=p zE-9;8^+Qp!0>xt2&9bVEtZ2pzCd98i7OxmiRiE}<%PMVsUm<}34%WJB=PX)4OmIH* zw{zp7vf&H5Z`$2{5;wYgGnFfN2*hdCFntPgg-QW5!}jl`#iO>qNrX=&p!SGnOqoB5 za854X(!ZHp{p1b`;}&vOh1dk`w9<@Mvf+I?jL4(f_#o>xkk_;UX=f+p_=nYbk*3Y~ z+!RRWznJO*AUX2R_+eHG$1QPlu6CF0I1tJrgg>D1brYL)IgTWgIjq<0Ea%^-9*sN|E!R4Z(XcrDE2Xn4}2XdqT!j$zCda7-8LaxxjHO}vV)g=0q%g7`f}H1vgl^v zp09C70?`@tOq;Uu4?q7!Vl4CX*rK8+XiWm->X)P$IL1f z2||Ifsi4K#*3(GE*DCiBG#b?|*wnbb&#+sW_NpgeA#Z9EzH(8}>uEvEKA8T=!m$%u z-{bLvGI7{Jt+;&ey`|VC-3bP6p!4TCA)`>FcjUF|eLbwG64dYn*0udmt~SJ*5DiYj za_6`;ouixfcBCDsEe%L?KzQeP^qaehR{$X||$1 zDyVzqQYXo{H5IM2tE1qXtIwgQc`s5l(IXh)i2I4-+%G$0T~SThQymkhhh<0Hzi(!Y z4s{smHMz|)rt%$7**8V!b`&)1d5|L&Z<{lpcMRXOOPTBQ*&Uar_61Mv+_fKpOisfU zfB!Zwgv>KPuj@qu+&Z58rU3K&EUyXzFF#8+0LprJf~LFOO`VskG&!*hL}6$0CHY@< z(e98?(Rnyf9>~$r4$?orHx}|(K){gS7A4H5KFM^-X&IWu6sdgUk=pU5(@ zkvLM4hwP*c5S;_%So;0EFSeh+aGJqq;7qVr&Wm?GUf3GGrFH9*N;?IU@ zogCngJoRD9D@chjJ+IN5G+~L+19d< zeW4v_W85i3<<#(FWngEm=au=h&XGm3`UcFSKQ~6pi;hV5>FMf(TXrM}YA<;B|M2f# z^n?RA0{r(Aj#r)&5C!1&?_u0qJ?-Y4<-FenFFw|0@Cd>H`y${+SEHjZFh+n;<8uF? zB@tmzVdLwleHGsk+{(#71x z)puBfJM;xy_dK5tz*mnZ)ce1hY94t!FxjS0Ux7>Ob-{5td^4lzsYu}W&C$Bhp9gPasO;A{r zvW!h;A#KcSuvu{E#n88OdoXghFxOXXyDxSglimDAK%$fIJ87Ebg?jaKbhg%iSzqFM z-x<3w`Rnwo2+t|j5)ew6s>(|V#Uno4mc&L1AtG}R`pj<1EMJI1t{gA*1A|J>QAQLk zHi=+bP5Ezv1Dr4Ma^BOmGsKCJxDl@4eD<@mF0!%?{h12z=(GEU$(XF7=gYgh{G`oMHsuc7I|>j zX3-RyH3JYO)rw?Rb6k8Kq3yd7QfE#E=QLq)Y{!xdTxJmJ{VEWLZ>%!IsHn}x{D^;u z?P=Euk?JF5K~0Drz$3*A65inEK=YTWf58-}m5nANz71-H`*aXdn&ldTJ(t;4+8HR( zLyRyI%EywmjK+SX8Xc@1jFG$ISmmIH6WmE9!83{M0O-SN+pREZ<|5bTJ1jYAC%cMI ztJL#cCQc4HoiaxaY=)^%kJncynW=VJ8Z@TBht)?&Fl`<=oABYeT%-Xdb{Ocb8J!N{ z@Ql}`z%j^%RJn*r(MI7Z+eW^@u z+T2?1%PFGzyTIQiAr__=rCk47{Sz=&{31!~A4Gn@e(?q1UY^7}PgD;*?rmL`J#e?j z!`PSyIAm`z%@Pjq1(!V8HQQ|LA*lAB9Wun1W0gS+cxjTaeZn*J`-ZquWhlgBo5nLt zHg*&jhPxN#_k3pRCM0l;Yj;(^{6{A{?_dLj5u|r`xTrdKM@rsylx3bV13F2EAc{ff z`QHV9YGOkObueq=U+@-7{z*(_teKxhitkXxsxI52JBVz23SX-;ShvbH?%p$p>8)!~ z)kz&NZV#`K7b_`A-mW8vF32N}R<4XdZkWxo*9UGxtNay-{1%l!VALx^9bOPkk5ihl zot<}H`O_*3p2pTsdffa}+G*u0`B_ux#52?Lvt)y=oB0PI8#s&Kfx|2>t0A#G=fBA) zNttglzyXFr8U%p$>A&RpWQI)NS_IhUmR3S#s#Q=%2bWYE1o97WY({8rb&$jz zOI=1cHi)1JX2x&oQV}FzWU53vy2Qn<T-Wo_kJt%w5Zj!$6vg0s@Y;sbBnshgeM%!}Xb4WM z{My+pN!l{g`-Jn<#25u3C1{5^kh@Vfd7|JlRFGJ4lqw5j$qh-r<4TY4Gwygr97>Z9 zfoV@zO?vG{6m({n=7;1&w3To5tY+uqmZ4kFB@jDi6V2w)X5%5g)vYxyr+}Or-UJ%t zQ`s5n66TEQAOgKXm=5a<=PsYM4^_@I*c!p9%BeB^lKkkJPSwm=Re zR2SXOT=_?Irh+9Fn=kjgs0sB{%%0JZCmcn&-s$2Oo$7*d%RK5USb=4OR&PQHZhTQe zLLcY0lQ7w{Ts*`xTQDK7Ju??6o7E=qyRaXxHLcU^-X@+~i2-|4{6Jg2EA)_uow&VW%_;EU{}&_S2ruei;}W`?N!3c@WLeNnL7RkFb7Bm zNGi8cn>>L5n|_?kfB`J@Jg9RSd_bh=+hgUpa`=<+)ZFa zE_CdlH3`A};SUvCDUvW1P?Y373ZbF4SfJwbB(JEP_qUe2t~+#`vgf;O0;A?&LPRO|a5n=a!-EM~7?o2fp{;5lek7`u?zQUKE0Uo3edY z*VixLB$84Y6X&Z6Te|>dDAvk$7BmHTghS@XN%DHK4DuwtNt?5gqVsO5V8;{1#8vN} zrT>KFjEff}3=f#HEvQJAc$%{PYSUSe)AlrFOIvTVfo4xXb@?|Ygyi6xtk&2fayz2z z-&3~Yzc3*b08EIRDF74FAUF7a%?2LIZZu$-t@~ZdQ`?IupzQ@)K0%5k@_^rh0By&s1X;pr)FmaUU-$0O6o|^cn^T%Kw*Ug#vm%_)AP~NOKA{+UjJ)Ms z@>?OLllCjCl}oQtSj&<-&qEpGFF$a9gd#fjy3RntrFu4=AUY!4eLH7S#}rpO`Ih^d z$Hs4_-Nv7%gwv~-43=~t=c==>CkME~7DM=&E?G}zGE3bxsxk(U$vIHCAMf~H=kBxh zkN*e~4v@pRvzh-$HKp3pNwf$slwzBfW zMN1}a(Q}lKGdSLE?a?@+gZ>w}p7p^d66wwz{qn;(`Mws2WZo44q&^A+l!j3jxuln( zG(c*a2Cj_)Qc0tb!QYGe*oAZAx_zoS{LJjST3y@S+!>1usJ6iZYgVT58S+%I7Dw0Qk`M6MX2^6MRT{d;+BJ;fyVlU@*Zb!(5K)dLhN) zuV$f({QqtiTK~J_5E0m1@V8ZBdD-;uzxGyPdEs>I^V*Y2v|u#Al>qF?jRBL$+w=Hy zSQua3V~cqP9xrq4r-F8n&W_iiVkFfD#gcS3B6<3{@(kzW7f?*zZzmAus9HgO-k;TW zRdC&a_#!_>3VTt9J0Zi-g+bitqoKb$G>Eb0y+UBdM(JVnvsK*kweC6OaJN1-)0ryV za=~%8#KR@A0#E^=O2%H5Vqdb5Q*U$dwT!ay&9NX1Dr=2#ph_&nihjQ|?H#&gZV9GF z$I#MIgnNe!~0%brvJ>_BZc z2lVOsx}@n1NLjUi$PtN0e*e0@H)3rAn4uUi+fmR|^Xd?^vq79n0NaQ!@lDNrHN`LB z1*m8uAQVqpd_odU!3&ZCgks11isUzdP|R~++L@Er_ZRSDx|cfzznI`e_80I1(1BVb zJl28U&QAAtD3)aB-T#q^0SLu57JyLfE(-|7`iOu~obVKiHUFmr6&uij3iY23)CLd9 zz6O_1QWqRU%4r90dp->oNMN-n_eOBH&m)2pFvU$HBD^x^`+boBcDM|L7J46HczEdl z-%*lG%+J-d$hIf`k;w7QFRwhPjdUeQlMeVS=J7}%A0~ug9dJGiRKp5(6wRs z)AT+6gCTKaRUlx)L!6hD`J-C(oILztO=g=AV(;qn+pKSG}|9DU5| z%$evfufDx+{cvTp%vRp{>1VtTfgz4rp`T&`rQ?UGSK#Y|3_ME@3$*6A6SPY^g^E1! z^Y4VjFK<&GumV4NccLlYO*P{E~A;wrYF?l}s~w=SP6I0NTu+J;WF z%MvPtedVrbo6(ac@~YJq6Z9Gc?S7h3&yVHnr>qK#*6&x`Nj3VMV@HHYj$af)kCe2* zcq{6?pyFg|6?_YSdWm7aJq~0>;})+vF}4IJfIXEFhC5U8GS_Sp>ice)G$Bj0g{On- zxk8tJ7LQos)jDILo2PVAnwUzCw~gS8>Sx<*Mow8EWQ$-+b)UQnNd`N ztPS32!t~80jR8GltwIJ-uyY`!*F!1aC6jw`YB#@OAHPAYf?4Q>>49Ciz_(OK# zX~u5NmorO{UD@0SB;H8{W+!k60Ycx+WZD@WDaalcyaTRrm!n3!@qgQ10A|aJ?$PI; z=f4GVd~aL|6D1`7$nF(kf{7u>-m$q?ozan-K9Ao_IkQK6I^npP2kH1#EaF&SU8!0Y zc0+wF=UQ3mPDjE%2sKQ`tx`A{9xHX;#iFp`g@1M1UlaaxkD73GGPLdGYx&59dO(D= z%^Mvk69;7%_pI&}dm+9bcKXi=Yv} zLh2`vXrbubA#;PYfDcN?c-+V`pNPU&y^gMk197W%Lb>ZGxM;Yj*anI@b(QeyJf+g8 zAk9~zI8(ie;_GJ-wQQyb7r(*3MT(bB%F*0ga3n@7qV;Am)%u8@t~tkJgCjpBnMWjb znC2wNDJbcFD_LUAYZQ=yVNMY~qA0-=b!Gf0!p1)}25Pd${v#l3x{2?EJPL3o5=f;z zEaNy}9#_>J{n%ZBAcN(8&sLaT*1Y?VvewgdH=r2=U``5{g*RZ}|MDSI0X_BBLaC0M zcXu%ckjwo5On2|5r!g7VE6Cog#TRam%fU9C3k2V09vK;UrAK6|R{EvWl6+`VhpH!S z#ciXsHIg)J)u^hgLML(L#yxB_j17f2u;#F{BbRFp6^w^i@gpYaO$N31{wOgs1awtH z(?un_+pDOnv1zIqwuE3v0rO_kcd^@ZZL})oQI`z&%K~*(=$=W2<@$9=6e17nM@+;} zAp*oXT?CgEvY+WpU(4K)elmT=h>+kGKfsVOhXMQVPyYq zzd#++-EG~U#_`dO9**W1nYFDmoqPQ?kC>gbKO09Oihh!}&F7g_ZT$n@p*MAv#Y_vr zcv=|q>?e5|=zsxVg;EdtKWx1hg>zQcXW5U6^1E;nMyR`EB}=dPP)5Wr6h))%(npVt zDvr!C;tGl;3@WH~cA-SVTak^g4Fjaiud`H*dsB~2n|QXomLa*AzLi$@K)!|*szh`| z9y|k0(_@>0w54q&clV)KJ!TES5Bn~aaXPF#dj%hfBc%HdpAbBWPVh)8dg7gbAYE(g zv_Yi_P`QEvTHBYkA(qc3Z*mRrScGy}E5n#5oiz`J;2AP~plKsa*XxKB)O%cm zxa1Ds0w;bl&g>wtEdATUwPqe!c^y_^vqLOy(B*QY)SM~nl!s%4k3#$s8Zlg>pyoC7~ArhG^*jK&7&ENgHd$x zO+lNo!V|CqZD=8+KaO};So9j%tsoLX6a<)Jus@DaA_mn0=v+dZ<+gaZ^ zIx*cC&e#Yd(^_x5k_;>Xmcn$69dnO@9cON{`J6=a(Hg`C=m&1wrTok2rOiNs9Rs47 zv9Otm<^d3HEB>+-7pR*(){=rv0bTlY1nX7gw5eLj-gO_}a{Tlkwq5lbsE3r{s*E{% zKfxq}=B3-FdUwGB=gDJMbi|8FgZYK<@sj91a*I8jBnv{Ga()BeVE**G#{l!ooGO@} z_wH&ve~fXHvg<=pK@cRx{(6hy2sS^lXaR3A4yyAqZ{020thj`WW-=TB_lj{m2+Y@5 z-LtgCubgpdgHD0E_sRkty`CJ&&ej_*I&-ht zkl)yK`#vQS1U0jyZ3T(ljnYE}#d~n(8|!GT?xGlA%B9)aS9oeOE6g6^Ln%u|=Bqa< zsI1B|O0cA7-{%9}XEJ-pMdcz~orXKdr7Uk&isG~r^)p=k7D(;Nd`pF$wo&4?5Dtbc zfA=P1{$Fn53}~l)$r)mNKKb|LM$#bwCE_B>h@l3}FhIUN+bbD!Tgyg}=Yq_9hGYaG zJk|N5!z#by$E&eE%nR!~@#QcpTqPqPW;QY|ZYDI8S-6?(F}2$T`Jr|fTBY(w2lJaP z&?$SGtP5Bv{PJGvaiu~WapLDhhPVcV97ezNbd03exqP)_d3{v4 zYYl!X>C$pi%5NoAe6yKXOuU6=8VY^)n|4eJg74mMk3V3aZ=fHuUqWv;V9z?(L+W1R zdp49gdTR$B3Dwnf6zdo`tl0DBTFe~1b7~l(ITJlhW7BhLN_?CkdPNd*$NVFx82jcp zYxxj1+=;LFw?E7BvPv2g^E1oMr^LRK5Owhu&4E)3jvOmV5s7FJv?8&F#hZ)>^LW_2kw+RZ@ zt|h}MWm~M@>FrYF<`*V7*GptgOr9EF90_o?DmOkB#Ijx0rBu?@kKKaDCD_pZVa;Cj z82Z=7ITnT&)u&jV8waYy%2cc~{KciRi~|!&KWi!|P~TYe;9jJ(I(XCn{wgZH?dU73 z$r|~GxmZKG)zdrzzN8f4gu8EyO4uy>jc3f&KYYS+N1(0+r}EYj zFS8@clp7#ggqDx~pr)FAs;xzpT0v=Wya%*h{xP_0>J7%aLiFxTz=P|DGp+|b&Q}HF z9F%8arD1GbmRHUz2s^JYLnP%duDmMgAG2K<@7%7yEj}3VSk@qhMT&o9CLQTfheg(= z?bU4fl4S9{DjSL^HH6bG(4Jfk2_$nh>gp$i4cF;Oi-;qCDz;WdtY{NI;m_l!(Lj~^ z8g1jS@w6jEIDLu&jMEgG%*w>F@`bX7NvE$<+zdG|XSqNZd;{tnn%1!h@NQ*hn`{Po zU-L+F5j;E9;}xtG#6QVU{%mg_TnYb~uBVypb;*%vqE=?SfL}T&h@+jH1We@Oo&v4l zm5;vO9-lFnPL_YQSEXB>FtvHbMF~so1lybu2cDNTD`J;;b9LU=7sosT+(Pp~`mM{5 zx6if99i&k1-0zSY7KRs9{g|Hjz^Oz@gm?X-0Rh^%Hh_6jD89a>KRs?S!(qBBc083w z1t%gVg!369BfJ4R{vj-**P1)GI^K!PMgs9lwwKRkqN!skk?Iv_csKPdJ|38oES?|- zP13vDEQhKVawqd>2RGS?xi1{3DAnt*rWcM=l3B%R*rN866eV5h4?<|v^{udB^`8*R zG6w3LytjWW!8yH&rb&}yQ5w-^YD>2bJ}_C24!PyB_sE#>8Q(0k(2JSf!eK3nH92*L z4+Togg)rFh1uGP|Cec<2m*z|dWACpb?a3Sa*8VQj&**~)d&&^j7KS#_V~vL{(uagU zTm>%*cg(*PH2^3qK&v(2SsQ2ohiL=Atz&$?wYY6NBqbSI3%kF5K&rcxO|2R)x0RnE zcDPw%yGhp{ep8D65vMea4xviTLKB6<=MxCJ1Jh44M>acf1V35T`1Ikig}kV8^O(w$ zK#vxouaK~QK8_4{3%pr{0ukBRs6IL!ZbqLHMcBp)#-t+PP3)HNv<~w)=lEDq57GLA z;h@GTa#tFvRdzt26`R?P&XDc}DnI*CIj(dHJRIQHf&W|rtrdv(SV0dx3A$ZH=3x-l zc36V3=w)-Z8{(AfxMJw?Ir;87dBC6%iX|qb;XtVvS^@KYo&+9a`+Cr%*gPmc!#Xuh z?W2`@mX6%%yG@gCWR6mnVGG!kqUH!y@}q&$g1ABo%cI6C0XQO90+?T9P+k12eWQSd zl9c6&3BCnFj*IX<(n_Yo=_3@6sa0R3NLA|)ZzP@ICdY9{o^nBF?Il<>8QH%Jxk?j6 z*l4^530=;3{rfj#e9^1;A05e0A+L)Nb>SB6gHvN&qGrR65D3wx5W3q)6@ktexs2HPCg7?5NPx)zeA%SBS}%{B`N@^5wa}VM@}@Q4cC~P(1S` z&EZYZx2(=jy`ExqhMEKbA*;^0ATm2ODyZ6o=3n&rk+#*Fel8eG90`)iY_4AWE{59j`)XrV+AWA_X)&n4ov7-21HOF*49~^J59Xdf|ZP(@#&pnXyQ*f zjf=Pg-lQT7_{08unPB+*_woWJgZvl(Qdx=~-3XX*z|@(s`-9MNOSR(qkslU*VxiC| zh#`Y~+zd!S&@OiasW63XIYTTTN@=)IIJh09y@aiuLC9eg#D^dGx#y^tCZ~2eGb`TJ zslBoW1=Ie=K3Wf_F*rU@1b=9rW_*!!&&c$Q0>KJcUjXLvmrE`&7IL6<+Itnex!Y2^ zRfjfuH4Zi)m})Gp6n$B~vY)zo<*@u~yA29U439MD(cQukjA$$SvJIW(*tCdkBRZTW zY#N37dmO_ZD*cTD7Q`Ck`IRXKNc_66mml%=G3-^{1^~ks;HZM+o4+qM(~COE{y%yT zr09C1QYt<6WZg= zkFKnY25EsvQnvnP69tg%c=_YW#q)YzgvV&ht)`^!2h_xxQ zCDTuUB4BYRTBZbts8B*Z5G=(XFqykTwd#kYgR!JMf$W>>iA6KktsDk7#`+D``>077 z2ZS~~<5PvmM-1Oa>tqoo04eVTq^(H>davs@c8PsAN?`Y_tN5Hu zq}^8}C^`}J)$s=r5i$Hx;d&5e#^I!J9b#WMWqopYD<}=+{2Jh@Ub@RT+#VePaz9(P z>S+qs(%i};)k0C9XeLj}*tR=NHw|lwH?M=NKAiDn0wJekcEI!?<9#_PeUuh23V}TY z)sV@Vebnx%ZXv<}onxKq@}`oRF6y?6mA-oL_rcz{hri@-O~ypB=m6s4A)`KJET8zZa7sbs*|cymxLT$)=m6$9|)<~l2P{p z3pLRZbqw^uJ(d<*oNhY)yo@5F}C)`-_8Kz%PN$Acqs!~37Yn4E)sFQar0=YpoG`;eq&2Oi+?`ebZrfAI6tc$`XoVmu74&PF%UDSd@2|uGPxn&A;gv(kB|k?7ynI<9NSN@i z#6cF2I3RolBo6yTPl-d37$q~G`BMeV1&}!4MFnN%3$Vy^jqG_WnAn{A+{AZ^Tw}&< zOS!2sTD1(xBoPdol!Pb^*A*&h%w4@zq7^CE<&!Fjm&6LG9dO!?p=o{}dS~-HC5`ca zIdYKkWynEhhUb%%0Oa6b;K`d-p!n(;XSopKfb+-c=rjYS=2sQs3bECfbXq){Y9AG6 z4e73@jCePCZLiJrlW;5ZLXUvdGZ}{;O5eWjiv6GzJgCitTDmLj?}Mpg+_;f;I4T;8 z%SB!d-GOR1#^2i(KrXgSSfx#=c+m>XF3-in_=Z!NB>=O(Qi{5Wrt`KYM+xp0uTW4) z!kDhxZN?(puBvXvFgpD6fNq9m3ajiD&+37#YQsZ^o==p0KqJw|d!M|-wjR9jDu)ip z_FK*ikkTHr9}sdGVwK?T8m)Ev;qX1VO(fV3_UKuGZRv4^8KEAlpKHU^uki8>4tkfI zQQsSFFvp?gyCfF->4W7?KY)vlVW-}K0p1!oYc{L1ANsSkRPp!5vaaNAK}*TqQ-42Z z952e&n4cRzswn-n1TjI9;Nv1e-OU*F@v(&HH< z8SfM#CJqM`-N3tyX&H?9*TSx|YGd(8%y4RXn!cnto%r`J%K4&vmiZrLl^B_l zjlbolK!a9H*ED?IA!3`yLuJmz`{+1+-PXHb$EZ6tt9XDZM)OoG*|e9ja-hX%(>l8$ z5!pJpyW#G=%qx!#Tx+(l!vwwDz%V*=U%u7LA%~h4v)4`Rxy09^?;%`%{uJO!F?-9y zAPQ2s1xhj2f_GGBpE!q7E1W*Ut=(7C0bd%>^0VT~zzp4gjs0U;0i_Ee-thZnyhN9e zp(OQYAHG@l+!$Qt%oQw+4tBEQ)gu=)-S}<$bsYE{(WMy=z3!^VwJRBf6wS)3F^ zUn?Wf@RLez>g;mTy~1y88pm`MX2#FoB1nl0tUM!X_#l;$o`js54=siO-R~X2h3Yd^ z4nsg`&1uR41LV+u(OD*=rgO}_6or>`He>Bp4LnT(!nL)t-QZc-ipLm-H@SmYMPDGv zNs}5%35i37b_51Bnb8*T_Pm$bll-L`EjMgZpMe$T@zT z4K9y4kII$8h(CP87fGHhEYB~(7^#v?z?)=S9ULdn;FG)dcQf8*LFdPDI?I&gG(0kS z0k8UM(J=oJEMk@}O6>bped)ZIu-#+PEK^;AAhtP=#PVtOLoW9S^O#{G7@A|_2)%WA+5nID&ff*dky@&<8e0K6JcP&V+OwZ!fP36>Uh3anoC z*el#j2vpY)AX_rCNJgVOT;qHsKDDj(x9M-$IyUaMQoC1F4$i(N%OuX4w-c)j^*Lon zMmx;g*{<8=*QkhTsaA5Ch44F5r4=<}XegRW_?dW_# zEUHkNqkFd#Ph~PEnrP+B@p;uj2ZwVPi??#pZBY*aGQy3C%9Rfqf%Ry_|^v$hgJl=p!@H&#u6?}A2}a@H3&xC{_y!M*gz8p(Q8SQbK+ywi z$3qZGorNO7xvSW&=}H1R@5uP3JuRtkuIB%nM+v&;{0nMpCc>X+F(kx0O{LDyJMlM< zvh=@O%>M^!3oT{-dtrm=fB9G#)60rk%+HHiPlV{d(=|_EsVTh{3IOuw^wG4Bkx7Og zn3Z_>&4AB;w77|ct znb=5*;g?(Swkht?^TVx4jt*CB>09V#)jlRmP?NW#C&-gaEcAhN+Cr+KNF-!FlB%am z?ktG(cY>i9gxW}g^)JToVwpn2 zm+KIt8UYNsD!g+P(=;Ek<>Ji{(0j>4;E8tMGN`XoJMwF~StX+Ryrp|M*BTokIb$1eR!>3!*ACI z)5{dZfAHJ207e4^v&I*Rz zLX!cc;M+}X+kl8V`phwG=HU{wQI}K1K`Y9xVA|TdW2??jyJDY-( z6J>3+wSJPc%KOCM&fTrT=!;|X`Z{4Dkwk>wQ74q!58h7pjfGCos+pz#Fz;~cLp(jA zaL~vfR`ErdG1EWXn*ponM+o<3yVx6EE$#<&*_RSJh=#}A0Z5im9{(6ea3mn&PMDKD z`SpBE(_jxwjSNTD^ef-aH(f47zyRS%CGkRN#35_tBWeHqMSeRRUVxt?$VJ>XTk*%D zl@VVof9V1$D}60n8Z>0V1iZN$I4YZLUm0)en)aXVXNU%?4-2)7m8Xf({M`D>HDYLv zrr7GKK3f%N!Yb01f%m3W`5)gQcYMF7%PbUX3^QnE|KTg{65HcX9BZW`VLd0lD}Zu- z$-BoeNHNx^6uy!5gRdxMxFG;y8fUXlqKxyOuE+m{bHMjL$d-p` zN5Tc+W1+IU1+J*F2d^fbI&JfK&npDOD?Z4;-EnYQ!|gBywsO3o904q<&$_zyRuKwR zw!7j6XfEIK!?kK9K;yS*p#|O^4*#X`XEuP%={Ss;w^DTf()e{QCoiHdivUmctiLpV zeQD>I2kH-CX=b;wVvD|J1iT(7Uy{W*473y2`b{*Ol*Pwndqq@O3F#920nMsa`c`mR zfTw!r38(D0sY5B0lY$kScC$9Jb-vWGvF?bZk7U8{XX@6~%Kd5plmqt{&E0#Dh*2AY z-xiFO`9=C36Vo$^9MGBbjMtp2h}f$b%NC6&@mvN4{*Mfrx0OQ#m?o)Yrxo1+*r)b= z|AfSaiyO3v50F7s4B4}uWKgZ#Kz-rnCmA$iLpBOy2KVbRz&@27V4n&x4n)=M#75i?j%$;K-PNm`EfGxSTJlq}`@EE3D(?6?6+yAcI2^TRd4uDh4cF?DSXurOLG z1TihGNo7Bj4R>nAEe>))eO_^YM?8!drcDV>xE#|cvb6H!)4eC6(6@>=_AG6ymAf%V z(@5W}M1$pn8X!XS8+P9WB&WSHXbVr3`4%$I$mkIiK}(nt!gpW8xU_~`B{;>BA+Mt1 z^Ko8-aMoi<7B1_0?DfRY=xDh^eWi+9liX8-OD-crS(*N;93l6GS4$q0SCIux?m%$Z z=Ip<3c9s{#n}6?SXMIr=_-C7ol2rKq|Bx}HDoAg6@Zgq+k00iV4p~xXSw#LH>fR|l z?`~`3jT+llW7}3^+qT``ZQE$lIBD3}ZuZmlVSinHuYL7!?StpwIi2G_=Nxm4 zd)z-_rGt`H%>=TIecWuOkA)##$8(-z7P{B(_N0q+%ORU6wI{EjFJ{{qQLq9hR}kmG zXET-PSRs)XYY8E1nOIcxv&$jNAtuoxSN`GOpfl-WmoW{6iALR5SJzh=mI)h7!)2$3 z5b@e1YE8P2!|u7J5Y~~4OR)r$6oz7SgBwsfH@K^~J((rEt~f7?2uD68^pW4j#FXI7 zU~V-|eIj7BwbNTGJUa^jpMGKED)xI)rZKhjdg21nJ7BK1WvA%~bnh+WW(ordMd?oH zj`4+nvA;hJ^X{{cAz|N&l>~9-?2ENjY+cV<4DxN!gF%mQz`KKKpMOkrT!q^zM<5ej z8oPB>Y(vgcVuGxfP{fpoRUXc;>+51TvyiYnuP}-9{-!U4>bH=&rios-auW6f0Tw(U zBnZVlK|Zs2_uRi{B4D3{8SutE9cL*JKX}c>D_@V$;0Q68aT9C6q%SG>bt# zSs-aYexg&717^XH)B#AxV~cuL0e1=UW1RhL{)94+o+|wFpEphm|2BF z%;ST&*B2FR)_D-Yhn_jz3c4LBzc&B$zi)n40J)=j+}0F8?y&EnMLLWT`$g{fuZACw z7XNla?5~^dm(}`9;R|aJz-k?E(^>THrrLTe?a0gk$Q>io0CLA!>MwE!I^vIfxgMLS zmR2yESXLPdWfj)k)#m>L3U`?vYp!rb1rz+wtnvGpEy6!6(qFawnf|R` z7W+R+Xi=S9(i`SSo^UY@X8;+jpLVK}BCrf%G!q4--98D+mC|xYEo99{@%@W-#EXKh zJ&Jbowo}d{b7ef0z9D%zhEZL9jnPYPg9s#Cz*URl&U=GUl!F zk+zf7S-cn#KZ^K%!g)rsJ7P;J{lmKa zRk!#*_ef;;t2)jfH{aC%)417K?sx-1xlE=HMTeM|#qcece(@Ab37E2uiKTo9T1&X`1Taej2kLkswj zxcd93zgo#g8^%^#rq@7tPFp3bNmN~`L7fiY^=X2GGr1Zs!0I8nGc_#^$1CM z20oYHEk*tSkVio*A0wqT{7Nvu@r*_hrP|CID|PFoe;%QEjtT$NVN71{()7ZPvcK9J zPrYvKcc|vt`z%VSret`f4KD$HoW%1G^U(QISBzW_rH@zl;3kzb{lK}cK&u~-ia2Ns z?*KBXz`Z)vF+X;Za>ssDd6C1Q7v(V4CS%4(^@MwZKEZ}xPPAvzNubBJ*xCfc>=86D z!WMr*)QO!vw(-vSwX+r;lC<2VwzMnXU##o34zUE!j5rUJ60iI52!64K+hM6$1&92VVS{QeVSVGSyxgycGKmZnab< z!H=mb6t(hYKsDG(CCZw}nz(HXMI2U8Wm6iVPz4Idki%Lbkqe2&rbi`Q*NZ%%%61X- zn?H88#yiaLzQd1B%|RNUoi4a5X|bDb7j~!;%O#?R67Cx=lOuubMkqHQLKm-Gx^GN3^laMTH z@L3U^@N56-yk`iPGSU6Zo{{61JtL8UXrI4MO=hmbduvIC5$1l&Wzf<{Y2{k^K@e}s zXTBx}Te;7+F`WM^Qup{%q#pOv=}$Q?>tCwgejm0`0jS6TW2XQdLO((2V0xkMdr7&Y z_)lNB*w}Imt47$!ymA?wSMRvhV$k+x1Tc1d#hvWLO}fVstL`!EtN9%(eYXK(a`i_@ ziwx>vj{c>aKCEUV1oz<`u?I`Q7-TPPO*FZQC>{^e~9*FoJOlAo{u`~JB(qv%ztg1f97!!EEStLbgVU%78nWofz zH!f+RA)Kw|j{C?_YYAf84~O4>!FmvDx?_$j0r@SDuobRMP+qFL8rywgIX<0=*1B5& zJwhw!@~Y;OgA(_{%*36rLooFWq85s_(>ETM(8ZGAw@kYXANeI?Z7jPd zI2m-xcVL+gWG-w|3~F#QLnC{yREN;Mw!yT(WN1+HgK$lCh*PD0hmuQ_vd}x1qWBaq zPVUd*q~ny4-~~R6t@bA66o!w({lMHyT_q@@=<6QR62tmkBmqBNxcgRYk^tip!t>Yr z{B2Q1ip_7K$_!VzLxwVH<13=5;7uxTUGjK8bRLzfwDB_-@6-_Z zL)x_;_HN9llXPz~ar$1T;6mEI@IlI_u}^IsLF6=G%gC#k@>MHG{;kGgltvB~E8Tnh zt7#%@KkoH$=8~x6z~@#7j;gSLKq@t89%vCPboE3uPTh&v`3SQWqN-uhwW&jX+16xE^p%a-JJjcApLLRu^+Hi%4UM$>;OOpqL}6yfgjI+EIP-M<8*`w zamG|kR|NgMO&V7-zl?0UIw!=#($ao>Ah@hpD;=O{VTDUIqK3dVspJ?-RNrJ;9#Xjg zHkf^g+_|Oi2_W!_5NDctlz>P#OiOor^DZAsUb-EnPHJ@`kb;^+2NSHuf1j5sM&Gj> zaJ)9E89R|PMxEHLOx!89NBut7rV?Lz}^g zX7GV)$*CuiW4x!2YD#a}Zg;t_khS)XEY`$@2wC>XGkEK|#h-rojO>5)1^v4!J67%& zc5>*#=U>=KiIrr05%qa+$0LIDd(dC+vH}2h((9$XayAQM^<$2*4PQ~ zN9nIv{Y!R*NMe~)MlPVkKipOJmm{I0$lX_#!=x_AW`60b07%6%dk!4_UA*sh#<7(d zJC{rF5(rw50AY5dJR@b_b|P6<>18=Om~O3+UA*0QAL(D-atObiT8aQpEz7^0T9|)1 zwTLWBgiOEQq{A@EK5HSN+;Ni1&1?i3?=mWtoOjc%v&NC{(b_HDiY00$DJ62Xg}JzQ zr~=rEPj4VS2==9ae3F3iv%lJL|EcFYBirA-!&!dw1^*XY@xRAS1o{c0IOW6&bdAq@ z&X}CZvNjUV`c*;zc2MHMmgXhjqQzzrFs_=Vd_^_o?@|Zzl{>y+w`?9!gd|JMGL%D` z=nHie4A_7Sge@@+2%cs#O_ABdaz(Cm=G~WtGuF5|hW9i}I}5k&-XoY}>_UBz z^zS=WP_CW54#_4=9dB*!$2v4X`bt>dMlVX;TPJfy1LLN?|0Lkh4Q@L)a$5R+X;BU8 zv*UB5;xmC$3~u_T7Y8HzU)_xV*4>Z+Jk9}!k?;dwFrEG{nzRMuk)g-C4P}W;!+79O zY@&OWXe5hyGS`{@c)lEdyeqFaLYyeGB?|R|^TJ2=wOdAQ0ma0OVpDmv?&?$q;X=|u zaB?GZ*~e5T1pl;KeB^tC1vg-qK9+t7ZgSSR5{d?7-_5Sg?^ezm$7mFv8S1w-9-`Gv z$;h8vfmr(1RbAUZmK1)h(kX~?c7q!b{rasgS4kpwRb>D@p}8vA$b6oQwmvAMhS;n_ zk|>Ye){9^==Esn2>M8g-$2iK+quiyy)W=@lZ1a_SwaZ@W+ip366ILIfC=Z>CKeh_X z-{p`0vClac#=lc9{BE=@syJo?sM^1DK(jIUndrFk;(&d&h8BMyazh_8(iemfjWBYO zl@|HF>S|wKN6u%x;-IY%a#5GQBppcZq=Lf;s+Kco^e7q4mTja`ky%RxU+L2)hPjpq zWeU&i13wwn2cJB-#2RTN0+&Q&EWKEo+ zAY)&CB(ymet%Z+qh^nU+p|FY8Zc2$CQH(35uh&E;BQ>KJnLo`BW^1LycRF?4-q@`; zc}2Iw#d|KnQtyI8>zZ$oh0Vpm8N__ItC*HDOl}@Mcb09ho*c96cuyF42d{d;?ZMCf zhdFhYznj5k`W@1wq9A2EBmlWKL+Rx&4hox-d8nd-@fko#nykP!Nl=es#GC+>zbfn# zvpEih(7TOO>2QhtA8Mg->uUQIE-mZ_tXiqDT0>y^9BC448P#P2s&)QHK?tCN?Lqj^6f?Mu-(8{>=O0-?3+tAfs;j16rV??<=J6v7O^fx?A6mP zHd{(Uj56&ArI?;2QzTAUx=+rdQJwH`U7)+y?)Kw@5oyc*;hX=i4f#G) zhW*C6t@1OUA-k>l-10Yh8=R6wo60EYaBE0+Thw`pOV}dE&XM+Q1>tQe zw@I~ZmvUs5u0a+{rModmg)=?0Gs1Mu-R?BG7wyuYdz*?8&ecoTE~eP7&4(D^&y)5(g8>FV;`_wTtj2qv956-+|(++YT}%#Xu=K6 zhi%bp7_M8y6$K>2+>+p2n5aDCdutZ*Equ~Mz2zOkMuY|!_?2#RHjY@DIB zBlxwCGc#K5n?g(_)OJK|2v?h>C)29E5a)gsQ9T&9tLD%*#O9EUm%*qpSkKN-$Lf&O z2ISL8-n-|u>5>CSC_d$DM40-7%_XpvnNj%eGOe85DyK69Ygr~pX02P_?VB&IVThn2 zZT}%ce^t(8{x?vJ;+o9>1MKSqs&=m*g(3;7Tm&(}InYM88**kL|9#&<7lnnDOuG7* z20D|cr0mnYF!TN?^WI_YC0q?0+Lx0f6kI%+b~vC|4AG8>?^E3|hh!#pEsNsU%cBr` zy?5E(NVKqntU~T6TAK?5_6R%(HQ^*mg3d;U&h2cIRF;iT2<3E6EShPd#9eeXWF;vp zn(`5HJ=EPi=BaQ|^4O*W;)xR=oCo0R=iebuaCC95A3#V%aac#&?+_31Ju%FJob(nnCYW zWlFN6m|o(;G7)Ck@z(Kt_9g(H`Tp_>iSNL)dLVhTLHuRr$8AsP8sgp zp6`JlS0T}mKv?c6k42x=IEiNs*Vwp@$>`Sho-!V_c|fQ;b=N3L9Ih1&VqFFLD zbUz4IyjyfE&E5Ub0`LFkl)m2ZLjtk80;U=P>Vg2qv?PfB+|$&aDB?uWOpY61A3P}$F&Ha>U+c|!1N^#G~R&BxG?(VB5U6Vr4tk(0RWp~vtCBxH)u6X-`e^{@- zN+SPbb0Vg{doHrD{;pV2l8FDsAA3RbBK*h@S+}Kxg5o{;{O&^1LET{_TO=t!=-*Ku zA(^Vpto$`qk<`}%r^qon{o2-uR^Zd%6|I>BBR})rlIewC)1Ix8Mm{JkD4`7QR0Y}9n>7deN;Jx;(Mg65ju%uN!rrY432A#i9z@_lGkI;?cCOB zSxz0UDV%0wr|cd4I%QqFv`G&F^H*#6HyB2*cVpXuZL0HwE)*cy;$^o@P+3wM_g)ij z@c=!0B`?+zuFzsPm};u$*liina<}Z&emN65N35D;9=W`HLEtz7 zSs{B+%-H%<&=(VlH>;yGKzyTyk)6Lp=iZwec(1o+2CNK@#Cqxou(-IHns&e+k)Q{7 zy=AdCW*U^qqJ#SOlZ@1S#tAkh?Z!#t?09ND@iJfY5 z+)uYDqPSv0YF6E7ijb<1#X3vfg|16etE?K=m+M9NgzFTKY$9uI7ZO$KAU>?Jfh)HG zW0g7nhH+r#JWFna==W7u-(~e%Y+>7vnIxM2?(SJJi3iNCg&)A@4EUy#N#PD)fwlOQ z(iIOB3OhV1n|FP5U4h z@=NVYId??I&?-Tuyr;N^M!=vyRhRwCIC&7s>U~vV=k-Z8k8i}x67e46bhAZJ9ETR& ztOGAG^?YN{t_Lla# zd7u4HQ2~HUUFDlW9io|kv6JEwWzv}nl#YuM^SqcR6^bb%nrM%Tr?-LUq6&Rw$)FqY zoAv;<3=`9NR#Tc}l;X@d0I>|`JcY)_VL680ICE=uYZ&almvA!F)SpI15XI&_^wpl3 z6-DVO&)2Q*80?pBOb!Z;~Nw6xtwa?&XNS^_P@J^+3zhcNySE|0CI+{Ost->ZV%k0}QfjDpjb!E$aZ*50FZW zJaB!WClq*%-~y!5Fn|LH-ex4c%Rcsa5O_kTi)_(B%)iOu) zQXSBeFp;?A41-5B;Ip8Tk%X?&#LNX)ulNm?N^Xkh|nJ1^~KG8%V~k65-B#TFUm=AwQSvpKC&+YSGzo1`Z7-J>`+Q~Uxl zV|Ig^fVLHK41LP9J zvaNa68yUiLzW2oJl~@1hHl|>NB%0+ck-nn+qDh7)WVm^u6#~F1Pd9W~Tf^N@OJSiOhW5O0H)MIpJWTN75Vn-ce8%9%# z`GpZlYeA8qNCg>OBs;!%oQ{_GjL|p;1o%h6wKBE1TNGEXkAsO#==nIvi86~ys6Vvz z6O$vT3$k9>DS~Ax6pCt5)1mPxjj)UvfcOF)Jgf?J-L{)7#I`-R--5Kt+)dsCW`cB1 zFir!_;eV>;B#lAugT&w_8H4}C*WA5bC=o&55EBzoAW!I@6{};U2eEz$+hbY&L_gGG z#PP73hFE`%&lA9I+{iv15zpXuzFe1QGEFWrq0C1OR%Ir*7m2Xz=5vEL8bWi-K8Vh+ z#J8uvTSPW;ehd~(+dYlr_7Cy=tCBGD@5UDZkJxxX%ktMA0u&4gfp>YBS(5v zU5<**OAA(g15-n6!I4vG3o)cyYMF&&dpQp_mx7P(@%2Dn@t6g=sXpnos*^|7hIpmY zR7+NZT(if>r5(4^_vR61@cz3_1;+xN(q85QaOn%(@+({BPy`HxS%m{4$r(FAJ@|`P zC}Pb##j#}8GD3zz+KY%6jQ+f3FF?vED#mmJc3(`~sqlY*^n7H`%21w|k=(N1C#Y)v z3~Sa%+lcmXs)t$L8@6iWmJX^55=g4XWa+2j^wnE_d52-vtaNDi!@&v9QMrGzE}RB2 z$65MUvrmq>_m{@?eIF#~!pmKTgV&VZ-utn)*FUf?YKQjQ*oDcNUF-+o*JNoUx=f_q zfYSRnMd6%}RO5XWdSB)D6b=adbKU=TK=U`bh)RN#?cT4mi|^Ojg*xhhV)z|$v=CK(8dK!gB16y&z-;3Ws~VUnIK7a4iOdVzCkKg~A|a=N06n z+z*_g`uvX9dDQ7J6fBYFXvk6R4ASC`ir+n&-Uz(JMmT@s_IN3mS^pWp|DOYgnEnnp z#Kidfbm{+1J_Hs=l4qDj=R^T5jj~4OEFk|YLMhZ^0ToeFm6&>3ZXKpQ&;jo;#*~Q% zdlyc0<;jFvMftfmsxQDb)oGcaP2tIgoSYd_)=F;qD-ZJkSbOadxVijme`9q^xNn5D z%))2k%ST~!#saAT`(x5=*-PpKKmCFMo@!Tw)kBf3S;o#O2!SZXtw#9b%c-!HuS#+W zXYR5I1L$yisM6jsRO<{bC^aGMr*0;NScvbJcFg_RA9cv?pkH8;S6yg2| zEc4$5mX(c>gcI8+I|#VO5t;)7@OTd78HhA_cRv>I_US z=M$bt{TbV5#lag+Qg8?qj+d`4e(5$&FUhK^`lLedVDeoy%Q9LIod(aeLabeoto)6w zCbrCP!=YU2Cjn27#GSGDy)y$1VA*Gp9S;Pr*HUDZLi6N^`Euv09Sm;WJ4FkS3Wxer z6CH=}baO7s)Ro@we&3i|JR@;RHU-5Uk-sX_pKY}G?h_y)IN8O227hCL^g-9#F@-cI?6y1fi0PGE13}z)z z3|f7N7{T%r9z~#sJOQ@Y2NwV0IT|k5uOF4I!-V-#tNm({7^1zfLCjwqc`+99$;5DI1r)@Jqc3XT|^A>SyUnVm5=qGJ5E zykR#2Y(+YJYUhYg%Zw6M8E@=ijE(duXUOlW=uJ zZtA^>-*q?^@zC=V`PPf+GHW+99jH&eu_9EpcdOqd@w;bfxOA!CG_00u>Qr^y3!J5` zVp!?byjh&dofubCKfcc{(dr8C>W<8*I;&$bnKnRQKF z1Kq>|rzhc~5Kx8##XI1l9$kt--`Vil7BYp`&V~VEOWT0Mbp>J5Xh7RM2f@DC-T=O| z0kI)YTEbOA9I;3Y?%>xAME)8Z=5{w}i9KmTC7lNUSvLT)8@O;4JpD8@EsR0}GQZA| zz`p}^`|QIQ)H$a9X<(C!t))s? z5|d5~KLbB7f#%7UmRBEW0iYEH-3*EzJ>E?{T{-(3ARYl$0Sp1m+`|XU`S$_6&jcRh zo?_NZ;M-v4v}?2wv6L6ztbn%4qn7g?_uEN{*}R zbbaMwA^WM$`IG)tbxpFfM4Vr&NpU3aK|#oB8&;pZq8CnmWLzDs#_)=lR z*Sn_Sav+UBc6W8E|Gc?*qyON%Vex98bbiDdlu9)>KVZ7wKQ`ivIz_Z5)q;AhSXFMP zI$HQhekO($-In#s%cy!sla0(pEpL8s&rZ^#oLgz@*$+FLc^Tw^L}aFoT=h42W5Kv1b)EdksT?59 zz*-9Mv*qBo#9S6q?T{vDiNOguuZd3jWfyUBv}YR~i&A*LyUc;UnwMthTwaey*ARsZ z?RbEs;HxNAg;;0e>DgoVE|#|5>k_65&qIOs6@;+~EX%x~*mQ&#`VY+{L+dEDZCPw)7f0X1UxR~txci%PHp@9`1P*%EXN^DE`!LD_%}>w zQWGqvuN=`!%=F#7Z%sJEW#5O)?6-VT-M0H}=z*shdl{7s3E((#U+NSxX>B1&K8qD{ zg4{5rvL}2_iowuFs{lLu&{*PrH_$s-9V8@OFQLsCzq#WQS8g#TDvBliigYcLPT& z*n&wGCZ@2Z?OTSkAOFCL0*0oqvH8)Z2qA}qyZzDVvpm6a13(Tn!-0!cFUpI%)7FG5 z16|mGD>ZnPXie&osHGPs=TdLI{QT%&S0fXJ2F+de-O|^WhYN8IgMMdIx%v~uPk3`1 za827>mFRR)O;RuE2K{5n#PaNKSp-;P7sKVDwz%9FSQoW$Zu~LJZmvc76LLl}S7wV2 zN%SL!>{O8$qunlnGPn9D91BqBH1n|Xg1EUx6-Ek@H1h!l2!ifkhdJ$>Cr6w>Wunyh z3%<0%Nw3K>w3$CJKG_qO)OoPr&@z_9NK{5XZ0_|e@7N(6Yjm}L)iH8}a{Z(>yWKJ} zrMkIgy~IAI<3elOcRqP}P)a}&FdYl+m&}A%vo}IhteZzt6Q%UF-LFTch~U5Is9u24 zr4U8A!fOwuz_YTF=MeqTuug#q+7al)=mCH ze8Ueymz>l<_oNRek0j@Voz>0|-O>%tlv(5E&89SBV;1eIN(nYIEZvZ}f%>13$$_y? zX`IL`;xiLz48)X?sIY_uzi_~enAY|qn+hke6;slXq)j<(Fs*hWHj%!D?2t7meaE_j zwY^|jKRv%pE5GBbSk1GjTBta2v!lqCV+KZ>;AS;VTJQ5wF1K+&M#ut}kY3a%M7u$& zi6eCwk{Oc~zCy$+K*m%2c1tlN>plS5*|*7fYVwKDt?<(~d{7iO3!Ewi?u8Krvzf^i zZEH(mD@VS8dfF=-P1s@knyn;wZ1os*FU(eK(Kpevnw-1Pt~VGV!~WgoLJm1PYo?F} z{P$J#4lANfw&j!d6~>I_&y$RSLzrV8JZZIYtb?a?T9(O2$?8w6KeI|R-k=G{3pZ5` zmadVAR1LH2{e*r-MdMG6nop$iC)zckel_(_`YIcOv_6HgX13s(@%cx^M3oM$kCr7F zC+C)1Txl}VdOb<9069!up*?4dxQQxEm*mG!i61A8HRN2q8MszW`;@OJ*g`vWHt{pQ zb=UFot$iPMgEgiJm{D|LWXv$F3U}z%rFSFqo|;N;ogOYWWqW`t&#H1Ylv1o)SbPwW z3K}wJHOdZxO9UoDkG?^|LukM^P>ypX=w@kePNqiB z71Clc>|ahBOJCGcB%y!dOD4HbC)4v5scAjEAlXga_g1K1C_p|mUK<=WXUTI};hds) zyy0{6GN^uJGHuvs(yV9}=S%Nv!`uli#mJ?il28+nKCgAipXvjjr^LnU@}q1RFko}Q z^{FuLEx~U|o1(E|TZ8Pb-9^1(H9V-JnlP;dTfb0Hf`C|S(`}fWHLVYoZc>|5eO!h{ zPs%UQoim1M*{0Vq2%3Y}PX>!tQ}ZHMeg%B5G+CTC&%-4T{xPC3Vp|m5_Z3~Ah9c-x zLmEo!5{)EM!{8_V)jtwk@~J5s>3qk={T#*B@%rX2pHitLE4vNjmj-0Zclj|yKOPL) z)^TW*Bv=~@MTe=K^7PnlUTmY20hQUlyivclBIHs_hi!%fWAp)ypfA`3zS_N>N7)sT z!@S16)f9r63Ce8=eYa)!=PW##_&um(d4*B4vRII$2_?5fe_A$VFxmX{xcY4SntJn8 zRaKNBSACHgH*y0d4oM!^n0PEcPqy_SB$ni4OXsM9RJ#?P#eyWXwnUp6G-KUd0twc) zuP*~uLqR7Ea2k|sC30UY+~NW2Wj5-kq=(WU<7xj0<}VK ze$>~xZ!+6!;=TSc?Z1l?Bt(B2214;z<4lrylkOujN#0KV*=&qALDtP=*=YkQ(tqYt zkZ4CF*6kWdar@kDf29OwxX?$(UJ$&9v63Vl^)G#s+$`|k(q`oU3)&NEW%zk9^j! zn<-B$kzFL6D!1g!5Ax8x!?uJhgDUs02f}G1lM#b+Uu(6<9Hbj%Vxq3_vZFj3w?Fs} z`R^h$Y-|$Z6S25EMgU{qRXn5Caqo;IV@KV^dw37b&%)pk;dGuH8GOTsP{n}rQ-gCK z@O#j^Wl#AMX?^F;?aYLnmfy~sQmU#fW!yA>--icdW$dzqY?0OJf`8OA6_De$MyEq; zls@#Fzr$|*wa=L60TRE>~lU&zZ$_2dz2zHfP3z+f%wct3Ea-RCJ$js5;ttB-@ZlELdch+{z z?uxRV=(;Zyn%E?F!|iy1hiLcW<2LM+U*_Und+>U6UeOk2>b+I9d%WhdZ*eRY1qd_+ zCE;#&g2?r$8?!N|Ie9tsygu+NzjE_v?0G+a-00rT+9=fY=>4QP%efqw0%Tew2YQF9 z{$Vo>EG5{PWT?=&et#iEzAVEqJkkG@kPD$mrGmS#`2#Gi6>MHW^wl0V8g^*goVf{S z=f@?h9P_)oYg5(}tFK2aF{w=-tK39kCsVifRAE^}&%##{#P|zXSUuTBWbjt(w2dsx z>$n93PBHhr4QWuqAMgP>}48gB|JZjAJ=vAq? z-1^EBE~~Bwswh+njYci}-HS6+NYriw+iGicCxCw8`%DX17fhNwpY1*TxnvsmBs~WA zK-bIRu#V95445~g5y#<`UFzDVti<4g0FJsK^ewenz9Vp0QhHuRYTOKQ3W6xi+wtrBPdkyR7s0lOz3d(NDNM@Yw;y z$#Of&H0zsX_~cQH7H?XvuD%4gTZGwYMjt(q8%LPUAW*p>t36+Yf#PfmgQyDY3bx$$ z89Lbhu`Vaao!y%d_&~bS7s2PU60lc{p|@NOYI9Z4L~Rk~biE?Pr$PsnLxS8)r)XEZ zsJf?|!5;oz|^6twD%_`w2!)Yi1>Dw2oGwbdk^nM|Um>DuWyZWA#4b0ufmbf!b= z)}zZ9%ner8n@7)$1IzpvHaYr+mJqkC8fNw$C_m$-&3~+BAHF`@`*PH>+3sAwTxZzQ zb7Yy;3dIa^s^Y z_R6*;v+x__{napA3X#52Qza$jRd~=H%#}2g;T^L_FwtEdYnyyItGO%l^I@feoK%*` z)(AK9rfFBt!VUqG#1C3ry9RPlaN$~*Q(4&u7qku|M((7@lFGf6{-njmcF;bLk=7E^ z$`RaVtNN3S1$a6fBZ@=km1PXpwbh&KBjwedi!G7UnD5iQlVnXFSL3IDHcT5!(jIVb zHMt&!ZRiC;yJLEby^5(w;P;+2Pj6SkF*)-T;t)3L;Siq zl5q)gSNP~XF(&NtOxqMX-=bK?>**tOX&d}>vzUMydj13kQt5e56sHU9xr5u26(8Y? z6uRkV!f&GaMD^rpkG97&u54V-YpD9!!UXd@%ma^7zt}k}KrEnpUQm_-QK{G+%@s0dhqM`dSw5DW)~D*BaO z>ES3ls>+kp_J_)!=WdY~iZj86=v|LLj2*QRC5w{>HqRi8)0~-&mjDGB`3ec?}?e`C3moa0zNLoc1 z(5)g(erTjJ;y|2b$83ry6|%C1l=+m^S;VJYV35&;6JVfA7k6Xe!!tW+X(@Dv-c9`W zMJoQ73PeS=L`0fCCMi(PdW~ft0jB7ST^&SgZJF4(XhCMWy&F9P-qKIw%(yf4#;64&bP_Zq#+4?NOkfA9|lkVT~qInng5A zQyFQFNME66;S`gA;0ajC!&3>QO2Oy)S)3?C&m!q@Fqr_GBLpit( zl2O>5#!$+*L<+HtXQULyT>5l0?hdxXV_V($FTqIR=i&x-;-o|b2BOG)XpSQG)!W*f zTIvx(W{^{GEJk6Zm*3>+z9y+z@#3@Rd1Q@*cNIh1Vu4Oa*i^rlko61YlQSQG;;CzT8PB(_ z7>!h=1SX%dSOT}82ZCSl>KcL%L$*Z!uuOj?X=M2~e>8w|Frbaud4l%p2keltxgf{@ z@$g=wRJbAQSO=4@0wZygnLviM5T|ACDbMA7#el>`6TCTqsS+u3DBl1P0%Cijl~2OwghX725yGhwiINpU07aBEzyCATZk$Y**(*h5GsNf--LlgANo zCQlw@uKB1uXb!=d-GLo7V~B=$S(rDu2!}MvMM1rBzTD@ndlbK1gaFH-pj8M?h$Dk8 zEx;gp+YAyeF|tj?t?^-=)Hs%ZlKaeT{_v4q(M?8$@jeVE8>8|C(EjI=WU_R@{FVX1 z*J~{vvz`q$y*vta$W)ew)q*3AaH3#kAxI~E!HWzhETkD1RA=Yh=Bc_y*<_D%6AYyp z5vHCPG~cJW<)t1m*I#|+u_bSL3tWv*Ne6aYkn-Vnr-@Hdn$ON%H@2&=>*ihH)3j6N zGrftN8X>H!e>ofe@2|~uLJ}C zu_9Jx&c72~vHX5I|K?L?UBZH4Kp_ju_g~VrDu8tD*S_9T14!3+#ZM90D*a^9=F+Ilma^Rx{GM$BohXUf~E8+sx*tet60SwSA ze~dOh1q-by{?e+~_1=eN;}@{RYL5H85aU>HKdQIkY~{E#qZY5=u;#nd4W!EOezq8A zbYu#)!8MFh6U+E>`BpC!EKF$T(8@u?IubvIr%vaBde7By?i7q6sOG6!oVR@rV& z#bXvPp2khcLyb=&oTkv`G@CU?03^+=4{$_=OT(Xm=lm2oA+`jrmYz^P!#coFIa(a+gC0A94w_RNv)`(vIf@9I2Va6a*^FlbgMKE%3Z=*co8Er}uJ|%ik zD3=W2|;>gu0~ywp?WPL)+gz^tE)Wxj5Wm(L*h7c z|G05xaBaiWvb|TyL1YaKTGH>%+PRZOV;Kjgu|Ti=kx8H0WXCZ5=QrNV4mi(q(fJkD zY0W$TWzdaijN_l+IY9wVcJgi4HUOW!V_eL4nCuniD}we6ub3}a7+$<3X8#cDznXsg zcf^*WU<_c4sN*KW3n-i|!$6evkyO z^o*Hb@u!_p#=Fx`Q)3ueL726thsZ);Dc0=!Y?@MAq3kD1wrjE1A)se9gVvLmI3h1Y46%-xIz0Ku?fP6PE@-e{#n~))h=#K1Ne7FE6s!ecn0{~wad({S z4_65`S!e@oU3Ln4C-E+h*NZLxO(L`#tps_km&5iB~vw104QsQrAP1$DC`3 zDz%LKe~8)N`AM?>rpK0v=Y|I$mqa{s`Z3hU^k2EDEfSM+B=a+$omNFZes6!V;u|5i5Hpas50fo~<7EVdk7sklU zOKv2)Z!z#4N!1@BbAXGiKTog+(%#3a}~z5s*7(#W&bK4M{OV>e9-)A}lD~ z)(ytV1+A}+gIwBx1)=}+MsQgk&F1W{e+ALdg4~ohC7O=FBUHeuIi{AduA4~~R6@IR z{M?&#<7iV#ebkdhAJSX=t_LwO`EpF@yMr*d{pHVLR_4FcJO2mYd4DCm#Eq z5%cTlUjD^*_-gsWivq@Z`}&Tpc%BUgJdbNtQaTUNY(k~f4eag3C0$G91Y>N_ZOssI z5m^!qn1&sKiKoq|a z{jFYqkc9GoPGu>#!iX1}{Q$~6N>F+Ve$ei60T-sm*b!)!+KtHArZ_g{%3$L-Qf%`= za!zIL;7(eB+X>MsRsE3|Nu=6y-LdP^g-BTUJwNS-^Z{>VIZ5Y*_WL^nQPpw+Z7obi zQ!^_cjLj1ZsNERH9+3l~bAFTtq z9JHkcbO#coLQ+~@Gxu@5AjrvD^1Pe($QqwQ;>hQQZ#H}XAL`!mJ@0p2_ib!6wr$(C zZ8x@U+qP}nW~0Vxk|vEBr%6^i#@cJnj&`q|W54>%<9Pmp>$$)8ec`;$kB4sHxmQ_t z9JAtm2}uQVH^{nRV8`OTO@nbFnXjQ#she>J1wX$kWnp+>1CrQ?)H==8UA+AFlj^7D z3qqK0MpZ9L*hfY`K#?DA%~6c@J||V|wOC(wVTHrTZ~W9C3v9HDnYHmD<|#|PyZeD! z;`;C>0FRmJef1a9@7nI)(ljj6V64ErDIm|IfPZnTJN(rU>fh2d7vhk&)v{E5=it?Y zlCSG(h<-l6B^r^lm=!=W*07Ly1AS`El>C^;=TxueiP?4xEfYv~mX_zK@E?9Ad?pVD zVVU{jbU%3SF^d+7t@p#rJglYRjumT8giK94U^qKor^qLP5OAj1sz998ZZ-bUX4m2p z-1uupQVXRkHdnWb+F?Gyb3O)Axv0g|Q{r~Nz+#7L#6H{0i7Q?7AAyyR;q zDm0I=VV5`(ebvNAt&TnyFlVet7MidDU^>m^36i*wdr^cO->M8J7o=_dD;xqp4DSaB zd`&Z(Lkm4bq&GCtROe`RbvR;SVOkCg)&*xkk)P=4-O1ft+1_+Tlbu1uF7(&d?}THp zA}w6te;Ao?G|cWkLqb26=KWbGru=6BnBG;9GO+*0Qbk|%J|DQ?`2(ak9)j>r{(ZJi z)a~rk>vCO!ipecPS1_REovn+5WQ)U(1t^t?m&gK!(@f*n=npjRTTB>(70*yLFIxpB zYiX2hD)K^>OQJEawpTxRmihzw>L6H8g)hv+1S<7w3{UO$o&?4_lDOcX3U>V@`f;AX zc%YIay=xOnL^S#18`YCC$1-Bz(j*RnEYl<|AlQ7j30yJw?$i?mC(6(T>*Xp5T6W5B z8V4I4gfBK4WGC`)!?P!{!m2h=!eNz&n!tm4FI=Oi3oG=#OCX&Jl{3$qSgboG5Fqyu zm9ZqI2YP76bY^u$!4Fd=t*4o9gt& z8rxjHguy&@(Ec;djPI(W{;_W&GvoWZbgaJ%u;09{K;H0lGvuv&g%_lUY31MY-+XG* zg}id6A`^V+L9-p^iCi#@`6q(x=TLRcg#`(Z?b1g5dcZ`e_-5{XF+k9Gc()E1e8c+vG zrcDNT*6L%yQ}T0m9`w$#l`uLYl{S@Jpc z&4b6X6keA`&68_g;!>OqMpS>yYYIu^stZw|P5-7u zfnq75xK==|?{`JTu^>*MkiZaD4FwbCj4u#GL8qE(1Rkr}OMiAKy~=D{d!pc1 z?_V)MHwr`JQ;9Vdo>Qx}VQxOWR%8Z#V3;A9i>$++14y3a6X8O~bi$7zkY9;LOn|Ga?tDNroqV$YhtN8vVxG1QxnABt_t z7-N>ut{-wXgxD#wkq)QdO|;g~8xcJ|ng2M}ovC;P9P>asx#?b5+W%WY@?0CwEKe*P ztHaN&HoH*I<7laFbHm%H!~XrNPoH5#S#)#;a7s(S@IixsNo`b4T)AojUoj0%SUUDj`2W`Q2r1{0EY{aOh~qw~iyq-~=yyZZoimDq)@{1#gG-+>0(#mM<2MTbKsh z911=Oe7Kl-WAC!8aKE)U5ckf1Ilk%LZQP3AS%AM`I{xkWmP*o9eo<`l=J@9I>CN%2 zS@tbV7Er$&->Tjm-%@@#z9If{d>cFle2IJ%;A7I!=*jN`Cgvw zolthH&qHakYX0Z)%KXn`!j%If&Hiv{(WoPX?vNze4IkAmrUQ)1;r z$@r6B_!^xcmTih_{?MCyWmVAQXW6YJTMpNKM0izPnw=#KW`z<)D%17_@W&CbyIcpR zye&d0lx|cGOj~o0ZL}~i&pC9qfOeW@eed0h?wL>&yXW>dWC7}b|IZZ z7iI5VWCD1D7+T-+SsUFm5mV`lVUH1y558;JCP+uZo-$s6jX5VrHFKQfDs5+ zkR9qfxxiB1eX_N&SQA|GoBN8;*6mIl-IjxreDl?P_eo^xC#Bv1WGmb)T24UNT_0@9 z`W&Z9FBD1Z#82(kMz1SGN@<;+(UR4G&Qu3-9=Vu4fX>hliEV};N@<)bz6`u|fGZaK2yXK{U&RSDzGAAs?7q~23e8!|Q0pK*ex`n;uZz@X&UQrArZQ~9svrj5$ ziE{`sk;C%(pQ(~ZAiJu|#$@tWH%xE&xM*h+vj*Lzv5OJqA!{HrP12)xJW_S+5pC== zjCFkQOA;Lj?O}>UPFl35c$%|yHG86S_IOin*Q5S&jNjE7Wcq!HNjYK4>XZ&T@Vwj~ zh6+z1QEVw;TOUpapyp{(ETXqt4VUNz*6e$iBr25K0a@7*0`b!L8ryQBf;>z-e^Cu@-X zH++eM#&$9m_z9FFaUgDW^fP#qNMOBj!sTT6z?sEx*w`RQJ*`sPK@}l6RnR4gMhAMd z_!_ZY=+J~4v%_dK5`9HbqoD&Xuz5X0=eeM3G%sl-U*Vk?e~DHQtycP=j4=le+2kWe zmZ(BVk|$R6$j3Ve?e9?^851dA8b7;TaFiZ5tP z$fe!oca*8YJM~63iMEEHe}NYcap2SQPaH76!&LK|5gnKq<(CtME{HQYe$83V46~cx z3QsM?Rk-T@enx~CqwVd|G85E6bQSn>!h*T$W08t6a*+&;0k%#HvgfE0PfstEZPj1G z^{(skAA8+1u)ga%XZ#Oh=$mQbARYWuMYtKC@7LrvYpDIY<5$f2>AEL6DOcA?eQk@e zc(JrKP1tN1w`Kh*213p5;0M5UQKsfe#{?Mn{96{X$%8AjawDfufA)cBEe>9YFF9+5 zp0F@U_85d7@hh$t?XBoM`^EXO2N95pp*OwgbBN<2l(5q=AGzTeI$(-5Ov?ra^Lv9Q zS@@~R)<*>)wOoKm#v}X%WszEtU3;8Un4J+Ed5%on$4xLHjZxQx5p4=k^Xk)_McdR# z_zZBNYXeUD?LT4FB2+8#OPiqQQ}$hLx5H9{KK?jd{lQmSGbfmjzA@4**tgz zf<|7azNDzef^60Iiz8>lunF+mdlEsBzy#x)94>m?Tyvt(`EKY5^aC;M`7cN7U5OVX z+ixv+(6$bRfi(dGS>1Qv% zA|e=TgB@CE;vOy`R5IQ*xCFAaKkY^s-{-ge2gu`hgjH=K3Xz-wiv3YD(|0&J4)Gw9 z#IRpZaaJn=aF8>1JYEHs9fyBKSpA)1b3Ud`U}NiA@7>FZue(aXnZA9o`mfY^i;YmY zRA|9>h<@Wbe?a*i6dRfpk^e$iDS73@!^M1WGrC)lIvBHdnjFtePrQ^2`q@g@`7HNl zlI-^U0WirL?T?er_&?kPpYeSlLq^u$T+aTFGsBy!j2_=l#lvHMx`^rL7RAKjEY}0D zupEWBuk57K_2R1Hvsby$j{^hL#}XeOafsb7yyW~bRk`RYe3NCl06JD^xrSa~6-y%K z?mW;K;lC&43D1iokdE`$;D@rJz+kVPbFZleEAE_RmL(aLk#OZiA zwQ7VdCpG6(cZCJuA&eC78-K^=wio^!_r2u)7Pc2!G}>@Y_XW4~$<8>{jxzDcMkr=F zZs&csk4Q=JjMRCiC#~?4t!yf^2twNaiOX`O{aFd1?mx5&7YoihW=!2>!cr&bimn%9 zHwV%Wq3~vxiQ=S~Ca69t;NPC*OxopP}_lrJub zER!xbHPGNUV)}n_k?KtouLH7vTQ8tT$`AB*k+4i`aXVPLz>zG_SMS??7S*bR`Y5@B zl`(JdU7NXlF^bNjkaqK?!rfJ=8{1=JsVPEt5BIUS@bZt-_eR5hk45(%sHy+n1_0y~ z#xNppKO#bXkk91$5Zn}iL~9xa)#K%>hDr`1HZTd+Fe>@_IYAb0i){q}Q7Rj24}+x{ zoNzi@Xu<#8i*b-4xkxs;`B<%VUbeWtK{1g3% zOH9;4UD(MZazx zPQU#ZH!ymc+lks)IBA(p%EhHqJB?C?)vD-?REGo(?0L9De{7z^^uFOB{qL$n?x+r!H|DUQhjbnYbm~iHfg2XES-lTt9FNw}rwH878eNa3 zI$zK>N3Nh=g7JqR9?^XR9QC#5O}nEm>^B()g~pqk{d=oBCH7J1Wdk5{;;eM3^X+TE z@Y_>(h{F+Mk-1R!CCvn6WUwshV z9U)ftnRaH!&=YRvEGU_pvfnViwR_x)vJ5!aYIId}JH!dS`%CD|B4MH#5BL0=^XRPt zzBnfVqOiQ5X?plCWa{Y=*bQ}9*jI$Hlkd*rmfjm_oz*miN;!yb+@G%UtZ*%fPsbJo zkOWJL6~0iH)U~D@XKiV%J%GGUyZ@O;F)_by!1*6Cw0{g^g^A^T-yYrX23pgSu)c4M zm|5DpTh1vp9SpDIqb_Xi2BO>S%&i1~sV&1RO;J5U@t`Fbyg; zRbKZ)y~D{0o>HGFHBITr3ZQUO^d`K!c-O<_b6O*o*9(y=(-0ULI|Z7Hznszcjo}%8 ze+>Vd#hM-;((9qPoa4@>&stt4@TJ5I5_4vr+q8HB)3KNx1)O~mDV%ts!0|ajQ=voZ z1&lO_Evu(K6o9(Tkyj7hcRBBb2mrSO7}XP1fIx$}zNY88IYT~>m)TSq4)JZ)QKH%P zXOe;L0iRJEjh+V}*?=87%Dwm$75k zdn}Np;AQzAeofi!_QYgM=%AY0lXTN_%Ag3#+XoB+3G?E$L>1N-?DpKBmgCZAn(AG? z0YwtQAPz3?bR9ssbi=PbS`H(0+-)OSOf?U(v>X`2M@C7?7ThP^jyG7>+FiLlcSQT- zs@uyHrA184)EQYLnU>~Ynmb0it@5j$6$iUwJP z>Id^}E%N>>8Jc?7s!|jV^}V>j*sp`ru;j=C^WSn}_#OnW4*d|MC@%s+UYp{H0v3qN zUxil!T0id()jpLW#QBmd#@DMjF1Nrj9h_g{I^vEG{^e-=|LewdnZK3ifgapL$tkgEaqKzLq%Q=?A@vRh z3&UG-G94iav6SYh`oIzqEx^EaYSCYGrwIQ>e1>yg7UImrz!dRBxQe2R|G}8q{l)L5 zcIZ9;>Jd1o)S{N{vJe$p_r@QO(fN$}iRSw!lNW>>4q| zzO`%Qw!C&;i9{wmED4OJR$WopXBCA0xL;9$ zzRZpO0W~;k+x(Ys{m<^kyg_c?m5Tm;6G+QRR=)`{*A9`i@DOr7jJbU^WBOG{%n&Iv zXY7L3Mg^sXiKE__iBBZi&*d~0iEuL>tpz{$EyJ{Jqu={^Y%ef<-Faj|?v2EgFTz2i zI|^jzN?(R*MqFex^Y0g&jdO>@E@ZE*7ErNBKuw495J#_JgedD+<#{1xaCjkvoA%m}(?&|d~A`R%mYF<>H7;&=Ey!?QmM}n;%Qo8%gz<-*&;B$!)?UT zYcQ4?sB>jL0BY+vRx~M{f# zbYRChP7Z0Pmq?W@lpkz(Dsu+jCJ#C`-@-;#AEfF}F~^bIb(a$`bi{g0Ph(t{^@9Nq z`Wq_jDcaL1tl<-eTq-t6F1Ke!xnmH`r1-=(-;mK=?4p}l*7}M({kv2ojQ`=h`+w*z%yhoQnjt5vc%z1jeC=>%=W$%1B$i?MqjQ@b zj$^SECgbTOiwA-kONo-w2T#3u-ZmfLcca-srb5NJJEUi?b7D})`} z3}Bc<+O^oV@=^GT2LZ{HHq)0;Fiq`cxz-TQU88jvwE3+OoiIh}rd7ChX6-bF z32p=;%&>81^WnAVM%v{iLlvOJt*Lb#`Lbi4b+#3FzCYM7S-_K!OxoIkd=K2P?yTE4 ziH2b8xc{~e_*8(a!;WKd4Rl_GwN%&BaR zjcpwQ448=s)?P{?)=4x&8~3vrHV~c|1cOS8POqf?dX~1jVB&&u?uFaeXAxP>@dLq& zTglW>LNJDrPfI4eAykDS%e8*$95QJfVX(z5Hg{$(*IB};F_5*Rh3945&xU6}y!c4i zznrmmCHns#?KWdGk61qO|2r{$2K$Yh8`X78-+wg9K;vy3K)1awmO1^#&F!G*Nc+Xj zeQp-Y%CK{Y*fgNhOdzkk9CWd{iLd^(GYd`RN0EAIvGiET(}?8Q zSxMS>!p67MBz9) zlGd%{PzTWh)VHJ}=5381ya%RD7Ynfvt$wKkT#%P$mP+}RwRS>KU3NQVZ08Ra4M@>ntBMuIqjrui1 zhCxWzNPRFJ+S0&~3jo#~W;E+Nyd8_#1?yWdu0YYWuy*JuE;y+JGs9_2lKe%Xmq3dt zwfNwNOfIY1T&)1YaSB@^-SvR{88!k_w!nPsC8S7zDK@B0 zsiN8eWb}0ol3HjUocbg@z=>Yr4x-hvdpRsTU@019@vS3Zx4S-j`^#*H77SaVYqQWE zBY_$6u{(`19Z$g4rM9hLR&>p>y5bgCVV`l@OUURyc__@x?@CyiSbi&(g%u^EHR++( zo{-vo0ZwdkNCWaC_FvZGWfE3_g@_c1ib^b~)pw~KMv@iDH4j8ZMaMsP?K6)9bPzd? zF(FzBi{l91eN?Plj0bVt;t^>Sr!k|Gby}UiRV(!r&)GXCbC~_!8+a{f5(3MzJ<|DM z{&F;aR=W}crFS#dLzF$%Kx{+5i5__Y+Tm>#hwVEsRsHi#FvQNx$J7fyS1!b&4?mPjg+ggQpkg@ife}$Tq}ya`I`1<{$USSJRCbpH&Wskyq)NvPcAl znplX_2MRRD>}W~dh~(rLtP(Sfs*a}8S7rpf`Nth~7<09?#m%Ty3i1$(Tb*5$E6x>) zyNcG~H4?~mqQHH~%EQ)dwQjT35yUw)S6tiGIsbx?C=(uu@M;8I^AMIAO6dx_b`u1; z=2=4Iyps1xa$GuFxD;!$_(PH5hTD)p3qEW%cDlyt3y?wR0VE7M=ZwFw>dPJyCMpB( zW-2XF%#chEl$2D4H`(c?A1W^_;NHgZ695+GR{m;)%|~I|n8v^X!3iIiMXEj5r}Yjk zd$rF~-2n%^0e!eI1T5Y@@HkvWoXC$EpU%myIdUMjEWVn(qQ8FFiEecJlG&QBdz(_u<@_XG^m@WeEo5DKvye z-=%h;PD!H9x)QB9<13Z!rWrX*o{4KC*_XMO%?_MN$ZwZJ3vX=~FI4FD5H%k?F&C7D zNr8PSBj(1}yKhfE?-xE-w#OXDNNx!cKZxbzic2{~UfFJw_;|x!WO@kXX6mqJRAV{_ z4U=QRQBYyb0@Y4rhGl%p`F-?olwEx{y=PxMbx%{ossf*%Qd7;fRv(3n748SZ%$T$S zSG>T(ArUb2&W(-X7fa8|LMGwJz{!K!riW(ZO_OPLgcseEI!S;q77*XkDhI6#zzM*$ zLxr_vhq@hj*pFJS-{ZENuQ!A1;_o60vI`Q|o4h5t=iSEfVScz}qdrj7GMzAEzzFL* z1Hs4+oG%;K$pp%phclM3BZy>4=G*EaN2~9v8opX%;VGir6AwVye6Xla^E7x;HWcA$ z_XUoz*{X8fU38IP`#rXXw2ABajC zlx+&Wgn#0^c<_(7fbZTW;hGlJeW4-pMAo>^cm{#nQ7)a^3<|92w{~yfy@1CVDi+7? zi^i;u{*HbbHGGEpmGv5cP0-*&U^%dxKDnxTsKLOYU)gYRopmd`TKkw1&S5-+a~4~t z1V^6qRb(Gak|lQM91%mzsIo{$5m<r+U%h;4lCN`lS@z@D7ktz@RZ!;86f13PDvt6X=QRtt-*z0NPW} zBUsPR(~pTt)kx!A`2dNbnXHh(^xux|xT%j_%aC8^VTCkLb00b5L?5VMAI9qbT+ydz zerMD6x9{~oyemfXX8qxr#9{s`CH#}iRdTz|f$8THyNoS@R>>IHpesgr&89JO%ZygB zC!M4zOF@^tZJk9ZQ-#U(Ysa0$CAzWy>*_sDOJq+1f4z0!)LofmyQVj6YhWVQUue)iHmgIlu=^7dJ)`6t~6 z6RQbt)&lQ7`z5tvwC|W7!6A5pm%H2KBcf%wlYQp^a}uTz^j}s%TTMgbon^Lzuuk>H z!4&1H1tvQaK{mI_F*Vg{nnU{Xw9Skw!d*j6_``HR+Q-wVXuW~YWSY7_Ym;-hl|Vww z8gO7{o@T|#Z8^>{C65S3zG#nUJ7f_3_KI{$A+>=LY!ZVDGDctyx(S$-s?TjUc|y{P zQg0~Kxvb}H@dE;Nwsd#9f0H4%LmRD)LLgh)@e|)IFJ?HdAqq|q%a2eNH$8~XRn#_t zBJe&=UrK!Fhh+SmT{_VmREfs-M3sZ=oW}s4$iH8DI&hO-eu3UY98yS+q1G<= zzH*r+=^76-mr7E7%0X|}f1$x#I&)(h2fFdKDJ@oQlLqpZ;`qjip89#?1z;Abx9cy5 z@?F{FACv4U^Z%~h%heXwOT~{B_A&heM(3UYIi+kpNnoSf^h>*kHS=(-bxG?} z29AGl5OG_+mB0RP<*yYKN{Qn_11zmOe=G>+9m@mF+2P<%VxC*yStRY(X8O%tj7I(? zrUE(TMgMQ@D!*nbA;eMmZn-&1boSaIvONiguaI|whGub7?J3~(@9!mIAWXS8MqN-?eWQ3sjy z#=vN#B8DQd$DKNZd3}cCyWs<=hDfIRn`i`zQIL9gHY%lWO7`sBM8- znwbeTmr(rLqd3-_3tZ!G^a_tY9Zyn7QHn>6B_XMKBERJCLZJX@V#a6Tgp<U_ zDR?d_KsGqdX2#sSNZ6W;q92&sDg=zp6j~>pa+d#V!Yz@-H>k6+oCEpI&I1SGzr^-k zr8@)LZ{?wKy!5Zw{_o~>WZk9PqmonHrq2^-Cfiy5u4L*?%}yqxalAl?cmcjh*8(o7 zSyps9rB^~Ce+YCQ10JFwMY(VGaS|Z%E@JX+01U_s`N}Nd>ONRW?l+kRr9xID;}L&Q zf+Tn0{g0SpEK-HJS4uQq>LVZ$>rrfoE#G#M&`5l4b&HFcF6t>+NE8(aBRX1ZIWGA4 zFrwrEReL+hcA&9fQv8{AZe%bkg_2;#i}Ej%+(Vp3gu*<}1a^ef^g;VJQOJ@b1Oj%NOu_PY@AQMs6|b#gNWp1P6a+?V*4|v^ zZY&)W*+#+^*U&Nm{@Kk3V6(W{Z=RY4-t{aQbBzQ8YHcvG?S`Xu)qXgzS%>P6A}lS| z{lrmUE=InH5UEw6xl&;SB#3cvL;2|0bC2x#T&REPFY2UAFs6whq)U~>>YufbX8L{| zG39KTAMqe?S)+bbHy(v#)xO;$7Uuh^p&Bck&l8v9aC}rKE$3$BvG~t!ahhMcV{HZwU}17jFJ&Kk%)MX70s*xh4)cASHySP2xHJjntpNQ)6{9gv>^}7!HXHU9M&D& z0?U)Kf~lU$YKXobgY{UTrTmi+x^&`#Ab^RdLTZl_|5=7AbY?5s1&{SMR=zE9xSrm$ zpKYh|i1D5&KYHM|e0}Npp^^!|DTq!;`Cu;CmDx#DAe6^`Yd(5&he&D&SQ^bi#wdw# z#F4c16yOmjHW>s}k00FN#5Xs_XSuL~;X)Xu90qg7qEwckS|AkKax#-{y&qOTJBb0W z0+yrc<(NQPBz<_57)OO%Xq)cVn<%ufn^9qcGhLnDw1Pi(Z@!o(jF*O?OrSnBs{QAt+9xjOG;GY^Y zM%MQwiT{D*jh(O#_(kG;`9|v_zs5Vk((TDh2F4zZh@IDp}mqm z*Y!!~dR_~&iffkjlTZYXdr{HA*rW`eBO96Y6<{HP_ryG{h&2R^ZHE-jh{#^ZoX6GGNJ&?yhC)#%#l7aJ^jk5MsYzd;@)_pi4>G2l%4Pa>e&55~Bu zydxt9AHx$5Pni0}GO19HT5)1)sVaOIorL8k-h48M+jTtcL{|pL+0G*vD!@6j6g{~D zTX~A_J*AmhTwW%ut;WGqV#d-wWjHJv?73#Hi5NK3P$kf$Hi!P8jA|j&G$cgcf@3-L zN&DmbW1xFq*2Bii`d`Q=28Q2O%)hJpI4Uk;zivLolQhm2%1Jbbo(G9a&{G$|@ODVx zN?(aVtOT=Akpn_V`;gC0BaujnrYhniL5;InTkfvfiSnbd8dvs}Ij-?Kh{CcRa&bBo zaBOfPE>DGxU;f{7=kC^?(xD(tD?RNmC@|rGB$tx2Kg8py-(2uub zm6%j?5QemShSpo11yc;M9hiowcq9AKOJYj8raoXdbdRV`c(Lbr`A_9Iy4B1Z;D4gkaR)h(yk-4b#NZ$1gFeC(DTeMjV7yHo-3zT3?xTsc= zdO=}{Jd>QAcULrd9NMsW`nE|AW9jfqeIS%0`w%Zv5N%Q7F@|C4uQN+%9c*tpoI7$I za8z_}8lOGDZiC0RS$q1$YMTL82TIptYh^mFPT=pB z`g*xv6_>slv(xnIR0Pc80T9WAVMqszc;!$})>oq8)Mr4Muh{2#+=3S;OMA9x6hQ0a zkx#D6?)8!sZ6~mmW4XNS4|~VN2%733$pS?cDjP??e)Jn!-5-c0`sl|aRUGce%IiNU zo~@}b!8pcZn^sE`V`c(~2#T_h-;n;F2613)nSSncpgO8Y(@+KXG~Wczw| zXMd9>5t>+jYeQt4S`B&H=EnAWQp}`_qSB~|WF@gGy34MXHVJ=apb}5xU(5Lv2%+0oZHj-Bj4f*bA-ZUaeC~dZ_G> zLVA(9J9Dg}(#4%4lu5aMXx2SZi~;zCN|n=x%C)AtAB~kKxhPzt%~&>O*q;ZiLY>Vo zKYF@1Vm)xQn5J!osi8J{ef^p1BmYXU9#P`P@n(%`mtWDJaVy<~^c)~Oa?F4D5M>sxy?69CvYsVnDh4&UR(@oR5lOwQos9l?w~ z7uXgW<1YD??j{7m*B3>$0{srrOwbxzuxIunRb2i(yzKS>czmBht~;oSzA9S0kq_|+ ziHBhTHr1s~qG2*_q0lt%z+%K~#&0T}aZ^}gsE{7;x_RkjO?cnpH+tVn7C`H^KYSMzd*jK=} z3I+CB2xu^M5p)YQi9A#dmFwIiyII$2{4^GCr z$0+yK`Kh(oKI$z45OjInd#==_yGa201kNca^(l1DvHk1yg&F=dEZz7DUdL$Ql_GP= z(H`llIEU-iuDFJG{#Rh`M<#SG?@P8S-X)jFWZV-D=QFj()Uyy#lL#15v1NVxGdlLl zX`~(()8N(x1H33)q7AQ09{1cB=v(d6f}1W(j}G@Bu+NRI*WOnfPZWdM zYEftd$c|Q3C@tksLp2DJ+mterz1v8D?5$tv9$9uBIyCUBEpEf7R%9zOF=h>=9g_rd zCGkk|L~;jS8gnRKf+UrOY-r_a$)sTlWs-zw?W=na6D4TM1}LH`3QO(XbA3|*ze*_j zB7no=<(rn%TQPlSIF>55SL`aA`24BeNFoE8ITR)%kOuFPAfNO;D9zG*&?Y?*ziW5| z8s-FTb>K9rQ~Bo<)hDxM||V?C@9gUFYwB>QK=z)WX#Tes_{Tc_XiRqfw!MEUN-IXA;1tKBxpLu@;&A^ z8_llqmip-qftyzCrir9<;}#X4D)Zy`p$HU}N!lD$6%B@x6&}rOV?^p85EI3h#Ljhb z5y5C3(rs0#GEtQQ1WH&&?Yh&OWIN4hJa}}Vz_h?v4xV6feQGHT+%i3*HK#ZU5(V@q zB9k(V@(Bsz7^=D-*6I>*CO+^t&(`cjbuP?aO~ohS%!ZH{ESS-;T*(v7RJzUK*CkG8hJmYYpv{qD8FX81VfK5&cQyTw{^h zR#7uBx~U}Y}0m^k8Wkt!k-w`3TT+kx1!Uv;F65XMo(8?x#GRF|u5 z3JD|;Gk=s3QaHXRQD>M4+ut7xvxZYa!|-RLNb)wxNh<5YH-UADEk89-{wYp3)k8B{ zs-46^5W1}!WvOYI}}r5`snjiJ#mh5Dms* zW;^tgyRXMCVfNgPKKh$yIGPk)Ru>J0NA2(v0aZ7|%mTJ2r4i%AYp;0%q9Rmb(E&cS zN`K|I{49h8R6}*!&np0~3iq*r>Wo*sqmJhqcK*BmW%CN?W^6H{w}A~lYn)VKcu7eN zHG~Z}()Wy`QQ-(cnyZR=Bz2Vdr%_s!fmFay5Cp3=5%r%*L1s$cg3b6dawlrxsmpR+@@~aufT6ZsXd!zb^qFEJ4lI#vHnNbL zHqjFYVq(PyRN;Hi)(SX;*m7jB5EfJy=hn#IK4b())`uBkWy*ZI(-I{Ft3t=%vY#|% zmEbo=7CS_#j_ZmFzzVNjR4ZnnCHNv9Zc#9YeVIV{iW| zy7s^p(M?OIg4$?8Or2b~B{2(46wOV(i;$)-+6HitY~B>UrYI=Kjhw7y9KTJ_KteFK zCMrd=!oC?zW2(Vpk!c!3k%|g&WtQ9E!hm5>A6rwaS)f5w`rPTP{bNfa-FWvfFlkCd zpl{kT{kEu@x`N)KHE+*MJw~5oB&$ZpOju$5MaOzyjg>%k1j+ueUK2``O{_;1=Yy7F zpQxvFlX1~KLxuFXQ4DWcEO*pYUxUd9Gg-yj9E5L>%faytbEsUD0Av^v?Bo2_V(Z&d z7PEBbmrD(hd|E%gG4VBMDgZN0viW~B6`zAP!RaG2XooH~MMGUDmIPZu+uFh*AHO@y zmJ=nw+WmwTUQ2KN>(AUcEv*0}Z}_MMH2_{v{uOr>5yY23RxZ zZ(#S~b8krO4naGEl_f#&Nap~o+Yn=q4uW z{UVLn{|Vf2ZaCAfYsj@1$-__l1%)b_>sWb&^_TYRJLiN~N;5a3Pjn46L23SpBnBcC zjXWmNcTyzjp+$io{fm&-x4OF8rTR>~=_^&=M4c-n%2+A}@GG7UL;7{J-6S?|QRXUz zGOIHS2gm&~N7fb%Les|2QD>6vQU44W`@8g*3{1bZ7PWtOOB^vH0~h?JcaaD8?H0($ z>^r2n_~=!i&sGzb!V$kg@G81Vit1ET9SNWhoJ0%s#irWh zA{qCdk#!3B?#jyMuT>(jGDT>pQ<^uo#NK<&f4L>zDK`zStv=ztxh0OOsr&zOODyzB zA_SCe_WGAwV#1qSqQfP)+ipnJf4LI{bW`EoNd{k~A7!1<<$hFP#@fxaRTR7g%+A#YDAzs z6sI95(IiUYa(U8AOXi)&N#b7M#QBEghwZ?n&?^;t(`m}b1^qo6`uTap{$3Z$KuFd%EM896)UYWzx z{RCrX#hdnlr*$J370p;mK$g-abic}n7O>6uP}5hbGzgkRq`cp&H3C(yZ+Cyf8ACd{ z5V%JbG|wNdewMfGF(C7-CJ)kpl)y3Wf7wKeV1=UzE;2tV1CH72j>S8qwNX3P=Ea#k z78CI7o+VMgVI&rpr51g@7(ni-0fik4gzlPamn{w~Ijf!(TzgxT$k|bMfiMRdgwCg+ z2A8|ZsM9)qlm%c>BaaROnufJXd@+?Jv+7Y4O22bcId#*)-zAf?2R7Rl#PgTa^{xgD z%kKj!=|pk+jbEI14iK7L3Iih7>>LT>ymg-p>-qYIx=VH@-{oA#NPNNm1M8gn@}iKR z^OOX&h15PZwd8l1)ZMi#(nA(w+F4g^0(I)fSKAT-jtiyqayDaYGh zA+7klOd&^(CU)}UjTki4+{-zVc8Kv%9eqUj>1?`fwx^ob7KX>s{8lYII}ZKO5)VT1 zl~kE)?8I^}*f_BgncW5ICLe&O56n2BtQcL+oaes>&OlIppSsc&E1W4i>bbyTJLs8< zW2j;M3_8$=q^zP;$Nflwpb21vn2Xgp_wfDV(7}oW0EsNVZ+~eC#(N8z{<9M%pIRm1)5BQp!Va&RL%J9?o#E^p z@me&qTc2%8^YEZPBQTT)&ygJwL+fHTMIKX$t8VbP1YF1&91^Rsd0# z0)kYVgm9GMp4I3zSOtom{->A-u{!{zHlV2jFiTRM8f21L{ez)rRq&^(1_P!^rI-9- zvnm*?7ov1OQh^*5*7_k>@Y0FVxYrbYjcHl-&_s+;Ac#zsP^s|mwvWZf9qbD0SS?y2 zd=1TgpWDn4{gXhT*_exVPre?C28LV6{#04l-X@@~KYZEDFFSbq|e=ss+i2}7?ep>!C)mtMEfZ8tDyJ;C~ zEiYupHU@qQNMsd5;yyA6iu6#MoWP?%-Hl4l##guiCg0G{{@_^5gadG@Tj~FR8lAhI zM8|o%tVsTO$_~n`01(vcDxfSPV12lo9xiL_lh!;|EzoNQ>&|QU3&3V3Oygh9_xqme z-}R`{v68zTS*;6Zov5+nj?M&y56KzJ` zk6}_^J)TCZfI-mNlMvLYwm8AU1W{BzLg)jEq;1MpkI^X|1A~}T)E^hgV1|c$+Guh~ z%gDn1`KjvZR>YBW#^)?QGWdTn_fKJ#1Wns8+P2-(w(ag|8`HLJOxw0?+qP}nwr%}A z&-Z`V-tYD9gXeG`RaIt0My^_`Dl^u7M?}NB1%Fa!o6GPuE$%+L0iLSF|Bw6jUq!Mo zviuLARXFzlMzZ_>twGuV0XN25*HroWHTN*+h3_+MRVGtk$>`gKWe=K{Gql$HqK_ zVod@=R+m+~bcKSh*NsXO^Q}9+>L2~~H?t7m1S~&uvnmV$r!Y!4lcY9U18v1@{5;U7 zj9E>Ny&QN`ttZIn-92ZWH>iu*Nx0oACUk$>X=sQULMwQ;fSxl^9V$nG58j*_YoW3< zl7+h5>R8k_w-@|IpuQL{5I_@1xU}2%Om1p_{lBOtwl!Z2AA_?^;D627;achyE@di@t(g zd40qGANo7kibv*J!8%6(9(F9DVqR6ReztYn$=^kyANqS!?GOEZmGmF|9VEbWwtbs* zNF&3KbtDZ8rL4?c_Sl{#=7QITq;1Q?0`2T3C2o50Tw%28KVbsrDXIUTFoB=y4nJW6 zZGb>x*8h8l$U^^LfzSVcyUSsr|F70jX8Ql(68wo5xBCgE6aHC8(f^|QBb@w}E_B=7 z@W$#|uztQ$>oIAdXJUAi7Hyly=I1yORZq?ltef8+%5`8ddM8b(9=d8fQBlyZCxiM#r-EJ|gocs9;TUiNPTS7Ta6uzjw^lWG>tp`T8M*+MP zT0c{9+wGVr^7rP))PB|Tdmp`++8TKN0Aa+$ISt7uLL_Ehj9f`dh<*?pYUvuYJI|H_WgeQ;)S+cJK z)Sx>OhNS+{XiGrFJ^8@<&TAw~YI)!a@Ni0x;x~S^mmg5Sy)9J3BA0y8gx24uXGqH$ z!2Lcb8O<;dI0#WT`oRN0!!XGFWUsrRdcD2(%I%zSi$2v<_)-gq3=vS!q}5~!Qc~g3 zP{Fc+h`87($&#a#*mIo`wQb)MznJ^+oDX zIi)?(-?CG$6L{kZ>cg{F}7+ z=)xXuKG`Pt8@mC{zK7SE(`#Z?YN+M6;5)M#GLF~X{IfUi*KP4BTTg90YnQAxj}r5i z+U2}urSO?sU$^(WnL3Zh_v1~!jMLj=H@HwF*jK4;%oSa5ci(n0UIZteRF=V#2fb6& zmzrRzy{wsEHtpUt%3oD%F~JA7r}*e8>FuOxNTF9$Ud{w_pYP(;@{`AaZYOayEnSIY zRoz~WO6;D!3#$<8H@}rxicAMzN}J>)3e4je{S;5TS*fiF$}&y-wF3-<<%uDa^Vqy> zU+q3)S}H7iKui-q5mgvgQD}NLG7Co$LoPusJbhnI1N6Tgp zYOQ1)lS?R+SRWQ>Ogt!c@#9w z6i{s-x?Gd1z6C`on%6Fj^{ch;7*{W{b5(XgIJzLIM>YR+FDgz-1dcu@MxCn+8(6me) zby|DC6w%aR^Ci$E0XWelnhQWvzS{KA6;)kbwWJr=oDg~5G4ohSK)0Fb&;u3S)pl9& zU%I6pzt2YVkU_)5kWZz34|D7bjR3~kLmU=ne?BHkkOkS?I*`9vs!}I3fH5BQnK>xE zKBxzjEujSky@O4;T4_s<&%NkAHCPJ(KaVXT7EO(Q!MP~?SBKY^8-6~o-v|@-XzE%Z z_B&0~^?`+{&q2H?;X%h4MYVL)i$GP(i>S2yVS|R|)of>+)Cg?+#faXrJn6FZTTKvv z#_1%3Y5)_cM!rO42#SZ8-ZH)t6)PwcBOsKUA*F?jl!-_qn7lV54^*>ZE=p=Q_7`X= zuxT0;@`n_hmtQn>ZYE&zOxCvkyN0EA_@zzlCrwlL;8XL;SDV56Hk$>?OYAbaJOzwY zw-p*oM_<#I023uzg7Q#_?orupDXkov<`~i+4P^V;Dta??1~(r#&+?pW7?(dYP_i%8 z;J{UOQzgb&x_SJvIytzXh|*9VR8SClIq$uDAw7Xu@JNe2b~R9kav%U;hyv|Ev`3-! zVvxicNljHJkUg?p1X;QzcSSIUsVh){{D5tMd=J-I&AC_Z25=I6WNA-!H7?m+-7)P1Z0jtqcD zc*Dr8pqDCNXXa$(>58oMT2MiwrD6P ze9+s0(ETz|74oKd8t(Txo5##qhn&No7_k^=@Lfxj5rdqEXRhgg4>7R9Erq+%MJAMz z6ODFE%z!U zGLP!qbk=<3Bq1Jyi}SF8yjvvj&R8 z^XAtf(-uk6<_7L`>t|C%9B5za>nZc$F&!3K;ApP<>J5fTZ_5nQ;VMWyA&1X6kb?mY zqD2_Afli1O5p1>8NNLpKMZIhABJNoj7VJJu{i3K_&JG>Deh7HjQv~Dq{9$5k%HO)b z1=czc_Zu}h;Kj3f^pIw&Iqu2e(_;b-8?*Amn8x(&m`A1MzEo`%kYeLfQ{D{6IH~I9 z?!KEu6WbVC3P+F-^VS@%mK^=+15M~d-viW%jTl+6s*BmN8?gspdPoQsbDxsFTrCT7 zF4)6`!-X76*GWgRDjDr|o=Vi`bpg5$@)5P>5GHe}2z$l7dy(y+l4oJAlTmpYT5CRBb0uMC%^8^Wl=Ccy zD`#5z<91v>JnBo*YXud-gH6u(-8*XzCh0A*vCX@xBkq>5%YAD{%rl9q@!t(2d;5W| z@Ttb^>7>u%dr5z+`_1zn=W;ICPri^VJ9uc(Y@4U_H{|{G2-4|@R(rs*Um%>`ck)#8 z4u7}o*PLwrcF_#N`LLe#YjcalWHlJ5foad1C|V8ba34dkJQmkptxafO)DrPGS2c*{W@umgbw2 zj;cqJXbcrP(Qkp_pnaU=02`Cs4(PesSHdKxDCPl+T!!+mUkg)2cnZ7{YnDOvfW_Ia zOATbnxac<_R!S8;$<)RwTP)+lVzWL0x}u6i?VL~FWSM%aI(6-poF(Om6?-3e2&+%L zGcg?rp5s0QNOoq@KP?{Z({GMqZgBwDqCxU)}Jc2!(CmSz#`}CZGp@ueRF{ zy5y9TD*=<{5;U9qeH2Mh7;k^JOrxeV8m(%{*%KPv1Z}E`r@I}U%82x*Ydt77Tl)hm z{XlRE9`1DK&v&;by3vcAt) zgmd&!FJC?UI1kx^FSUMMF|j4u@>?n9h~g zZCS7Hv9~2$K^QfKUnO?JP0?Sk07bnfuR>k8B5qiL-c+D>fqSfEWotO#A9?&PQnUW% zlDWC(X!2T7^zmz&Z;QizsQtMaBD zuNfF%0d*OeL1&M)#xcL{a6}{M?k;D4qt}PgPqWj-v@PWlbPyvK{BY1HFGGY*V9t6t zxs(cb+J;w`ii`MFqRqpjqo1L!jptn1OGePk=RS(_9XOk=7G23?fN}H8Mda17voVU) zAVHZcRccX5bXTflp86+4336g|?Y7+gy8SW&^pmEcAf-f&bv1dnhw$i5a^FQ^>J$9; z9*oIz3Azd8ShSbz5PA2qZ%|n|+%S=K^0+yxi(qEG`2xpV*jd^s?pV&7vAwc^Ewx9@&R z`Ui4j`Ofg4uh28)n|splwufkL5vTkwj&#;r_lIa)>irk)H_>QM+Yj8&e3MLeujnr& zx)sZe8^oKxJ< zq=RDUzptf&f`MgkLY7H%{{@PT>L;(BG2o$dHh|ro?rL%&|defw1FMP>+bz>zc;+Z z>+C)r7j-nnDZfR!hzl>A2za=R^~+OrKkqm52jFjG#WkbRdj*31%;uqpA&i77u#fj= zouJp<_3PklFNXf>Z!Ua`nH!tCUx!~#FIXR+Ux}&GRPjSGDAf^|{_aXjLkGp|Ju+A~ zCJ(AK(gl>9EN#7@7D3hb_8MUwGfwP!+ z7dM!#{+Wu3shk{4-I)1JXe4j5!dMSG5A1;yMqzUlE(eSGPNVDzCn7QEw=C(T$nvCS z<(&fRH>9Az%v>S{iUP(=eeP4iQjMJGFk`i{8y`o8G!1yBJibe}ov#e&nckTRlZu8w zixc`8)657_kE5XGsJ=<%h&XoBO5vmmxqWLew9WWNPz@4-@%EDW*{->dh-&o$dA;cM zX*;7vgTlJ}zseK{U=^_!KX55=Q|oE+pi)z4m|Iqjos5H&3l4Yh3CJ6Nd-s}@koQ>U z?tCj`B+v(412!9N6-PIQ-oZ0wRL{o1DBYsa5CAkAwZMTM0YSyDGAcxD zia9At0Q3+dn9F%&MN*9gv6A=#S>zv-E7cY7^(x?h7u+QlW1KRAiRB_#Y_ojK-!?*e zDW>^AHmm=hq7K*b=9n25;|mYgOH37~zzv53q{xA&j<(B*+L~H0-26D&K+EB1Xr)un zG@B*sF0oXGm*q~=f-e}70-k0pu)zmyc+)RmrA<8nzyn^Tn~$sSs$rhd_tN~!Xh5hC zYleSesD4L@N)D{vCouq;&xFf_T4n*(XH~>s|A4ra3Q!53`gj5=yASzr(9gFOXNIvA zWz7%lx<7mthA`#OL7I_{g{MIdLWI&jJuKz(@B(>(O641bW= z90IhuZgd!5)Gb$5>@7dXb)g|s@Cr$LloTas)Cr|Vl1jmp>^F8hfWnUPDfI_rPgJJ_ zq|liMM9r{t83?PR@d41nX>2)m`>@NN;&9YL<&@|qjVt-%L^k|)P%bdO)gACh1e%vX z#Do?X(Ug|E+tcNA*XL?8@B5R<_SeOFw-`;)ikgxn6%wA?@j2F6!Q%EDjduJfr5 zkx{>oq^0;}gWJ8dWOAL1d8Ea5&Vmaq+%TtBAAo+Cye=kMDF|r3>L4)=QlV8>N^yM3 zBlZlDzao}MLO-18IRKC?eNTKJi(^YtzjqllSO7!%oI15KxRZ>PAdKEFTQBr-jF_OM z%y1pko+zB%S~X}?O3(}SRn@NWiyiQtLL+{;Xu05+G6~_oq8MeT@nF<#jAS(2`N{(j zWgC8U7R)laB7x#;)w$t5%f+XrnOKY>P{;yABMiU|h#nZhi4kI$`S5hX**vRe0MnkY zmpMnw_$ct!AU0>ahv&P~^USH;Fm&G>LNABo)xd~6UDzTg_6ziD6a#u7Zet{jgb6OC zk}S@n`u3;-CC=K~<7^0&3hZSQB}K*6fs52`T_fi&I{Fi zN_Lm)+Z(PTMr9eJnnco(ZAPb_O2t$PI29y3zqPTQJ6^jGl#XmU>x3k)(Fz&%)Ea%Q zRp967`!Z3Vb7?bMQB=l3i>cN|f($C|jdMdE#U5*7R3cJaoKn;UD}Uwa|B<^eOQ%(@&TPQ6Uy}By6=F z_%!f|Qh>}adV*{8KRjR<%RkoD`rVVla=FD%;VwS+B!xw;U|y=S##b(HuB-Ky&L+}K zja7AHonVxo=T;JSo~_n;WzZsbsA;Yxaoq@_>DXQ6ojNlppq!Yvx^6D0Xrj1i)JTwp z;d{J&h)9T)+&${hE-v5ZDT!aSNpf&_`v@#3tQ}#DcINw?(M&d4yR<2A0>)Hc{Mi#h zNn`@|k|8y*b&Go%`;JQLEYi+RO70q=EOy1kf9g-!zAF8TvMkr40qSkZ09r4L2;MQtKJL% zbx@8RDEYjt2|ZfGE-PlxjN$M2Jb(X_TL`9hl4)`=5&Yx2;S@kVINU^m#AvOv4FcPG zwy^MRPj3_5*f^VhSkivBRVYI4S`6hEk44!tHN=yDI|p4t_+f*15vPQgAfgU5|qHkI~;cRuMXgv~3 zR^Yt6tYBMfF#>vMN3ICLxOKRFpAWphYR`W%I&aPEeJN2Jn-}S?r^xfxSJMUV?k^@Q z^S|)+FCv@MBWp`bIs-bJU7vzdE5=u`;>M=7IzFqa*IDU)Q+7X~=>N7{!ETRFaJshA zE-0*Gf>x5~`j(O(o{T%uoJ=Qi*0Y zB|(pJX#$3s*INlHF0h6Nz&JYxK(!Wk3YyAX5cZ|Ow(Ft?#|Iv8>n~e2Q40vOWN4rP z_QX;MJVrfEZk19OU0Ih>$9=RZD&r}>nlUL>3XdW~x)M7Khdpl%3HgDS#Rkz=KB2hn*I_F+Egh4zv zcQ^0=3tpc@@Fo-vM$W_E7g+oquuO^R?^$W1eR zRvNtF8IdOzgq|lMx>rtUqec9>dziSmJIrs!L-Z0uD%gz?50+Ax_5yrfWg2igMgN=a zN#N@J>6eM z&3vgVcVnJse3wP!A_b3?=KC$bp#E}lKxfh^v7&7v1?(_!=_{YG>d-tG(SV|LRaqZ`!Q zK?d{K=BJAk^;}K@`Rl}qVrtuux2-$)zIiA5>f_&#_u4uK|3r>@UNwHS>FB>mKW6p3 z{>gE&kN#^bE@1yLc2Y1_7?9G_jm!U^i997S{WDV}`%iF9^PixKC6vLx$$jERbVGVK z{PFu|WC@kS8~AH%5O!$Wr(3_1P@CO^?xq@2ZtCZf@VWmL>qbTD?4L;3>aSy++u-@; zZ(wJS2j>6n?EP0^t4u8av(VV3)_T-N3!>+B^^84$g=;qezt7{9OLja=4E*0ZERZK4 z+b=vZ)IzjX%14xTt;*O=gMQ#v5o+zT3_`UIQ)bp=UjKj2-ck2xDZ_h4|IO|FX*XGA zKgLZo*3odrq;AAGQAakIMP5G{ugB~1DW3N)uV7}Ug(39Gd4>FattiUKCG~|W@Q?Rq zouJd*ahqa1uiAc_Z!Wz#)17Q6u*WaAH>wZM&%ToJz5@p1KhOrlC*5V_25^+HH}k?D zsX%DqP!@=txSu=u_5H`E9KIC1yZM6UU@zXkI>WT#Uo4Un7KMu(qJ+^h=Er=gqqc%h zf}&G6ISb=yb%q%1`C>mN&IqjTtXE&kzni2rar zwSPDsBO9rOv61!3}CZELFxyuyZaR8+`Qg>CgeZfUeeCD zy*wv#Szgc>NV!!y8B{&=;KgyDu$5@Bmh>MI*`z)BMcKHvS)j|0IdU^TwTD{fkJi(? zCn9>{m2eS}(&*fUT}!xxA0*Fg0?ijsSXIUa&$uf7Q zTob@UgkUV^iB_p558^DLAG9oAI)7<)2<(&G|7|#kn7nQa9Y%>Wci~n4k?A@N;^p+0 zSDxkGb%Np1W3hrKCaCExJ2huGd9nQxLmtR4!jyVka)ZC|%v`*k9E+faxK_An>gZ}v z920+7S>VNh(>7rmF~ea}j4a&!$@3OXH2yeI2*AH!lzoO#yQBY-^ruc7#w0@~4MRbO zMdcDs@}Gho<4dYVFdI4v7$ywdTg%;R8p%;Vg1IL2SsRXfm;fTL^>c!ONzhrnw|d=4xLyk3S14zbxywuGG|WAM9_1u7R~anj+K$xY#If z;H$`#0ljFAH}}=zs+aIxJ5?&nXdiaqFS8dtL%&v7gA~-YZp#CjE1+F7?50pYGshw?w8WP3;XGqL`PfW;mKts3B?8d`In~mt zcz?@Hu@C^y{QK*C?pblck-$!Ku$#EWdY#sCMWP!XRNoSM>PkCKp?>oP7}H>)BLd;X z2eoq6BS-+7MLJQih7!=^;Jrtui82~6G8~Q15$E8;OiO88wR&1=aIeKcKv^1qAF!B4 z7ws~Otor%#@Vi$otYWhTgfNTvh|Cy(m*B*p4aW+p3JP6k%kX;qH3ul;`F5LA*nqDC z-%`a{xcPW}Feyy<9KZR)G(a0# zQ8)m}oU|{QS*OoP3$n|oDpe|P3pvF%(%si}bnK(0N=X%3tP>K!doQO<4PSlI_*_k( zLx+lFMQd3ZseLD`6qZDawN`%?dwYCus^`R(Y-6$Ff|Ck}5D35z(~mL?0u2C%6M}Ks zO9e^DcpRS)4uMoD(in$BS>X=ioy(xlx<#Xo@#={u4#1~HY))|ixzbSP zyjFT{*IE1!f?+u^KVet0O<7|0i7!d5m~Ds5m-U?12PYeC63|4*pe6?3DARgQDj+>g zuS`ySf3D*FbBz}XO-(<@5q%6enY<7f%nu%j!U;m$o?~Ps3C;2kJR^01xb?9W_#g4v zWeE!GkSG>xQ{=k8A?Iv!>So~7%Z|B!MxsDp;_eixT77*gRX9TQ>Vy0j?ddBb&)l(X z;`8b^ap5(x3L0oZXfHnAqe}bcf0D{C8=v@mU7`?+yF^PlR=^57$nqev-ylM7b#4Jl zF0tKMxkbZuIqUUKJDdNme^n;4j)aIq#@dpaqV`Vi_2*4sipQ2phE(?A+W;nOh&&>_ zB4AEwVs(Ho;v&@maR`_UptFePGZ=5?8i=y105n+9t3q@lZ285>6`RjWeYgsY^+d3c zq0U*_*+nl0IfaXQ8Zu6+c*A23X z%MtMI=i;(yLa}}i@ixf1waapRjL=gpqVk9+qF-PQc4BuuJy*^|fK!Y|VDP99T=Eq+ zKEM^Xj*+UPCC z$hJbF=d>!Ib9Yo#hQ}CFpEBW4l%(0U~s%ss`)g0v4F;wHMBKf?50?_t{DuUD$19?Y+P@-VM1z8D)8dYnn^ zp{uW#$`&VLNI?C>1q>t*a!F8SM-Ia`p~QO5oXA=G+ zb-&vocgd}zvqhaRJn`>e!Qqx@tow;nkyh<}`XkCxEo~wKj4W`cfH;1Fv>Wwh#;5}k zSLy8EjX&TDoAck{nk0wmLK6q~l7GH2k>lH)Q`?zNlpsPs7a_FofmA%)ke>%lKREi= zq$r5~nh}^reQZ{59Ms4xA&x6pyP8cbrsZPAs_)(Tux$Y0_UsnI>(TRf948V;tka%o z%f)YbeHmijIeh!ssLnSJ;9C3_RyGe2Z$}nAJPomG)Pa`uF2A(Ifm5#0APBE~0--Y; zt8z6v`M}H}<5bY!rfmRVw>gG&DWgx+bwzyCQ*;H0@ME}AXD5{|nw99*ul;@=k1QNz z{cbZ{%5$%JO}gQut~nj+#xZHA(ZFjdK<>1rC0Uz1;`z`QaLA*hC_f>jfkJ+xSAF=z zDHThPMS|2`1}t3G@lh~j`AN-CoECS!S%Xvu0lg zceGpUc`kZ!fbhQb$JUz>kTvg}Ni^59-ND(l1!&rDM8|F4JNC0gjuN+O)26oU_+f;d zoI~Uo1D6YlAN@X70iV)BqY{mfk`4?2K5|)k2&Fn0c%$?fUJ=wKry=XtXnN%8+w!Lm zo4+<@i7xh8h==Q^Y*M5SfD}8_8_kQ-?W!(%cR}rB8_n5DXw^db9v$~w9SHn8>w}!D zh*_ySC4*Jf44Z=Pd&*KLmQJ`04E3Bg6~ksU*O=Zn^H5pJhcD(lgdh%b^?>u))^vy^ zjA?1yd&t$I+O;-i>)(QGorf)*wiyIxutZRA%XWci2g-{a-@iw;CW!S2Y(+Di*8^qi z-6|P?XKzOyxenRXRScQKo4J%G`-tQ|q-Uf`-6XYTBpxok?2+FJi+x3R~1K7cE%SxC@NB zq9qA4Sv8A$p$neU*#bFsyzJK$<=-bYCM{z=qV97ZFq$fe;sNtiz=8JUQ#`M7j+W0~ zEFJ=;f#v)|V2FG$B8~0jUEy3q75mny5?|gBp{KO5Ha|iN_tynJti1_!_w$~y1$XGI zkEMXL`h#Gp+Gndkr%5FN$QOdIEouhN%daE zXk}Ds58U2+uGYbw*m!E(`&I0%Si%05aYvA6F3-Q%k-YbLGNDV%djPYG1N4&3E5?7N&WFgQ%3L411aH9Ou zCAxd36b={2`$+!4R?+djk^i@KtxIrMA-Kp z^}!XfA68)r*E*12=t>|%9Hagy!?N7{YYYN(34~Ul zhq>`CeyaH2mDxD{tE7}ntp77n`TxWNAHRW7poz`umaX7tz(<^#$>Ts-fAGMB-v(w6 zk-=#kY4y@i#3R1_2D2!yu}Bo7S&31v)5Is&>8)=z^!ib(B5a;-b}yg!h3Q&v21SQ+ zqUdCWQW>XT^k#>!TA*B>pU=BG-l<;stZqqT##7@;gZq(+3@2(9i7Vq2pP$1r^LDq7 z%l+`Yr>D!`IPx0RC)s}~8NLp0oZs4k%?4VTZJ*@wnBAV9TBb%LExe?YNimmZzxyo%o9!gJS@}&<%>+cU&89FYU}iro8}E(Z64c#^ z3}aF$E3~g*_%Y+z+g8E$7Y!GwJ3>+gHg9MfmFnx{)(2*%2IvabrBK#}rQ}68Qcbr` zPgrIrup5#XSeBSJO){qy^Y8q{If8JTHz*=bOeV6P#_!=DD7ZRkY-}dg88RF$15S5%`)1!p$`9!*D)HtG zBhVI>n7n{lTv(Nz8Zz5r`4sLr_LS;o>2G2TuHkrATZa75}E2EzmgnIg`p>ds@5Q0mZ4tWMyQBH5;l! z*^o6OdF93)MNg&T{3VF<{80Q4GMGg>`nrGmcAv}s8LLRxADdYwIC9&{aZ_1a1fi-g ze<}v4?U*dXUv*L#(3jVZ#4MA>DmlU(w5%VG6cm0b(Nk5aDd67QZw4`gY8~Yt$OXJ& zrdaB$3YHDDGLNqW+zw+r2s)OdqIt;tJBX>66Sly~v5Rp74gMz^XK}x`=@p+CvUOf| z?~F`Xtg9*b9%IAsa_y(1r8myH&hXR!J$>eG`nE5Zh^5Pw;8!VSr2lMETdE=4w4mEi zR)W5>l7K8eI-6=_v~@a`Pc^kx<}v=Zizm3BMFyH=g1U`Fk%t5dBK)8XOSG3_U&pVe zhMGm1C3A>73pqlPKnmsCu{6Fw#b_ojNdH zV7T_NLlnAJ#DBArOB7p>+a!@DyP3Kc2Ob0SQ+y!J|Bfe15_tsHEUd`9HTu__8S5Vk5w{6boM>DmzrEXazN({BJ{1VTJ$LRbE8LB4`1>US3exwd9Jgv!2~{#2;S zPL0zpenlc{~28VHwO+J&^3hS(v>Q(ca7+vaQy zn*m%N(jY(q*crcMxI zTzgEnkb?HNFUar7`)*c15q3?t%CPde-cbypXy?^Wa*=%!TKz_Y_!iI7nD|&QXvIak zZJ4?Z=<$NJn)5%3Ab^>GdT^q(BFcO=o!s0-2ZO7rV27TFlEIJTLtO?x|pF@iU1 z@*Bz^{PEoeufjH$4EJl=?Yv-|wj&3t5V^*V!szLd?nmFU!P<4}^j2sx@ccJ>52^E= z60TA85D+gt&a+mjvqL?D|2ijE{06z&TF$U_gMRUTAnseiA+Zt0AWtJG!*}(eE(=`6 zaRjTF1Okj%9lM?B6O78Pghe)?Y0Ne*F72%l)?^31O+(JWB(4#b1WlYl+td~8LJANk zE*QcC;|kc86HyIt9r<-)FowltyP4@)ru+odBH~iE)OG}u^@cILp~~!$V=#nM*e;Aw zAq2dkp@%S0DVX!MZZxRUeD2U5K7+aEG`F15tuZdf;F7UXX z4qqgNBgJaSlVY3}c<&7D+?jvS1u-v|VxAl3e51hTG>Va|W>X#f*^9eJtL7RKTyW6! z_iNrzYAF<_b%GK`+E_Pep!mCD9Z-ROMC?MslYcYRUU|~8kW86}1SFIRA$2kc)r55& zq{Q0H8GE8H3hAB@<|%#iI?#G*c(W-fT-K^RBHAc-toU0HxVA%gfj~*w87%oK5~4pR zZED~WtV|fAfvsIFF7!HdyHh+9bo|P7mh+9{I}FUdR)1BD7u-oF&@RX^DCSWKVdi zzRm)+=*DX~>hBIZyOsglK7lU|31ArhFj1s3qB{IZ3^3uS$k1m;aZkQVZTFmU zc{;E_1IIZzULL_S%B2HNnnQsmjhGL3HZ1|56i_HmJBa(R9t8G64x|orN9Ww|ae*ni zQ^5c!-_D_~iQfqq*6*Q6TI~x{2erW6Wm4PPIN?tsDs9QVB}#j-SiY6C`^Iwu*()R6? z%&w(-_sfX3LD!Qy9bkTT@yvXuOu8N?ZSEd*=sNv-dtIgMY}?m>714PlHfHWbz-X`H zU%k$+pfjdEHntE+H8s;5pT+S9S%S_Tw;4P~+bA6k@6z&k`>h7IAJhGz8_@tgN-okN zMcFYw#0ej2MknA@wo$vk0PvCH@g92j^Q{hX@4l*n)&7vc#((m4Rg6;6&DEnbq{|TP z_GCRfo-WrxQYvqO=T{mI1;fx;cbg<)i=)#u{lj|UDI9peq*rd+Qa_!o(oKA&Y>S6H zxe_Vufde=V*?r)Z)ZvU3@ss6BayJ4m$K@e6`J}rvB0t1^nBR8e)=pF#@({XdDT+z3 zspob^Wz@~P_d@V4P1j-yP{OnFYr9W?Q57QTdYz`(nLeLfMRkcC_?;==5mOdf{;f^DZcQ&^dR4H;xrwhCz9olITAum?w z&P1a$wj7w)+sik2hE034sO>)#L$6|2vMZWxxa3#+Kv4;FXs+Y=PiWE^ojD-{yTqOw zb$^2tOmMiIZFDYtagaWYac8~(m#L2eblYy%L19pAM_X$t2UdlAS zbyts+tJ>#ELw_Z>G#g~zkSw(EeiKb;5XIX5`BwU->v9Yg!|45|b{vFpLp+zr{8gU{G0b?irgza&f}*15tmZvlau)XOkQ&Yb6uRev_P!UUYGS%B&Op z#cjgf(G*+|cb2?%@k(#autHVG+|`(%<3zkbT1|I?2>_piSU`THVVzWq07 zl&p@y%09*6fEjo{u8eQJ{4&Oqi-e<3pvh0`;wyO8kBuI%cPg0n--Q=lSGqr~M$vZv zWGUMDxc`h|57z#yC~c^YsB`iq-{GX2f}=(g$q zGu*1I02owWT#z>Q4X83%u>QZ0Ne0IMF1(O~gYo~ndda1hWHfd&V%K!_i9JB`ix+^O zPv&Bk3!XWqk(gBpi^YfC`O|GOiN%VW=#(T$tHewUWG65$Cfg!VO-zo@r}*u9$86{xtbJ<3@XO2Tu+L^xNYN`lHi#HRjRs zqJpN;NZ}kup_B z@}!hHtz2FPe-=Nh9^~>;Y>I9e;U6k%7Vxwb*yDx0Ne?id(uRDfBd{YTboz}x@c@8N z-=Ye6wAUm_wubk{!aliMQu;|k5lT_uU3NS+{CqG|>t8!mE$*plyHQZc#vXCfz~|&S zsKAMtMItoMeotUFj$jPfn3<_N5}f^*Eudzm(qYW>wYkuEzi@4wy66?T^6qDd(X&Gj zjc5Aa!r{sOly-lGEYr({aLM$3YY3K%37J8SkxRSskRnyePF?ERrQNB?>isDKnTv=j zqjWA$;ULb65Me-`Ygm}N>2*jO!;}}gO^l7DY_#J9amJsN5LZ27g@x>cG_gF?Eua(^ z#)T5A4`YZAj41jgkU63L(hO*$^ZG=nI?*m26i_mIx`w%UA8BZn@6Y|8CTR1h!@DGN%MS;&xR!}?L zC<$sss)N4P6CmbL9+lLkDB}dBEyHkEpR$=tO9^8K<`L?w3s~Yv?dLA_kG&A2Jp+j^ zduFP@vEQ)F`?Q`J)C{{NF7pZc!?P86tl^9~Y8e5y3~dAX`F#$r342Skd^Bi%>xg{r zm)5Xq08FI1WQD~EG*Ll^GzF-$(6H3k@$)1*0wCWf6o)1Gt;Dd&F(0g&-oFbAo(mK) zJJ^$w5qPVpJZhH;AdAuxP{aqRR5(yt4U-k2;y>kQVUo}!M;{MaUWpTT584%L?CFZ< zvi1lX0I~)nZP3h7b#u!Pd{fe7pjKuI?s}vrsSEkc-6)g<+?mS@pduBA4kRyGjZDub z@T9*1E&yUh7C?9-eX?bVv@EJaBrTfro1?dQ+}=+v|KAg<=O;Y%c9g5SwL%}N4a^iT zD{BiezYaTpnsu7LmJx`9M-fa{QWfmUnW28EX6JX3e-!oJeP&)05WDj;1b3P7clJa1 zD>G<@)cmo9iSvXA3+MwlU|}c(?gG#|4VmegLg@Qc)FuVhS5RHMK87ZZPLZ1b|da&ylVA5gd*Q!hm@L>V-YCX2L z1b(Yjvyy;;sjKk;F*%4^bA+{9?cj0Bi9`(t~*Ik-te>|PfYduPFX+?`%45dQw1X>7{kkOn$yoaSr2 z8G?!^VhIcSW+-T@3^ORsuS*i_NzGBFVJR+4vg@f*LJmm+?n%yJ%1=+3X4Rbk%h+IL zf(ky@(BvBP7h=d_vM z4h^cZlHYT-L97o!pjlbQs>h*_Gl^QnDg%;nDg^wJBxNyGd-2Kyo;pZVoqZaq?Mb&T ze_7;e8xlFx*|M)L%FN}5Wt4EK@;zo>)Ji>cvvVLWnMRewFO+AMEqJFEhXRJ=&^mqr zDzbFlX{0_oekkq|woevQlA?;TL|4&vU_Y7e#KO4i^4s+giL(|ONrm=YNpwbwoe17N zf7aTijMif!ArZQD-8W+ka4oqf*j|2_Nc-FH-v(I3to z{bjDXFy|QSdHFo^hjR%V3mt8xg}dX+@(m4ymOLA_ok<2^J_%M!Sp+e(w67OEXUi&d z2}jl4JRIAkx;U-tMJhU7gO7pJ#n$Briymf+H7-1Ta5I{d4ej!3%T*F0F5w3wH7txS z+p+rL)8I^_%@|FmLA!RiP0DgA3~F}F&i#yBNyuD`-Ya8KqC@bPL?okZ*D(TV5Pj{v zS~igQH7j0I2H)vcZ@*7O+810=>WX*uuKAIlbsN(w$wFCRzHQx+LIZ*cF^Z$BwIeUpW-e zOP~}Vf}ADI5=}yen>S7ULby-G;-t-}G*ZhnWy~F1;HQ-AIt-$71Lxk3;2$WA8XmHl zRT;AoG2Yyi)|Q4z#;m_eU=}dzOP3tV)5yN05h2ZJO`%{$L+vmtka;VbpQp zjNLz?rn)U!mYf_~0d*TAoaXrw0_UslVu;D61TJbpD2O0a4 zF{k;H-Os&S(b-7C-M?07Cre5^eVYs9ax|fVru83hUzHvN3oP^68A+|Y&kO30`u(91Ct=_f8yqp@V4R1hN+Remi8Em*{E zYN}6FZx!UnY|lkVDEDwTlIO!%h3P>IY7GJDAE*l?wl!eG!0|y4%wl-1t?+^RcHrrjTuh*|WKEHn6&wqG>-@r#lOJJo8wY$te zzww04!ZJK{Exlp3N(F?1&99?{gxy)KUU=KR(xz5%CN#h;McAFjvk%V@D7|7s~AU$5pvuH`{~NHj*0q)c4T!{+6(Cek+~ zLt8S%?Bw~{FIvQ9pP@-%YI9ZY|C*G-h$$!y6-l5@Zv)~D-FJjk&=@R(=COmc>r4hy zhsD20WmI7Rri3=~Bp@_(tqqrT>LOtBg+DkV)ogq!|K>qAkPHBcs?{{9ww)l5EnFXj zvtg6*vTc@Dut8DDU$_o7I7bdf{8}v^qbblbZBlirPRqUFn_Y60Zw7&Zyubv|k=3e^ z=rb0a#NKyHCN?z~pxa|3CKOr^vet@7ASIbp4Ox;ir5_n$*EQ6fMBZbYY?I#DdT&^C zTOKrp4NF4=mMgE{+6)=Aji*=`HiHehmm=ZR>%!Y? zcpdpZgXzg8vy(YiY*+$+!wIN7XnXa2jY3`kTfm2uS+&CH+yx=my`xZ`RM%A)mGXt} zEUl4%1^)NL(_Es7SmJBP^s0m)w>ua9>xD}73iCq>Lb*kOF2NmTD3vuHOJ_~wKWQ32 zoJ;5h?AB>TB!Dp*4o7%aeMfINRtG7%ksP_{HkO2%(jwau_6iX-LG>YJ#;KS z=W2SWV2&^~-JZLPJ~7FMlT<@Bim?e08EF4x%@NPHhBvKax=RNb;HuZU*J>4x`6f*f^oCawYge6S&bIc*4~y2?+-P~;Xe=hQz5?6ajLVopxJkSVi|eKp zSOt?f(yj;Ab?Lx2p-1WI+!JwHx+eo)+$SR7rV_AI+0y~R^!2{4sZ$k|wO+5PU?;h= zrZ|NJ(~YLrBnf-)>$Nm>*2$c$bXHs~r=eNA%{+4!z&RyQd!hhJuVbvFE~4;`rWNQy z^U4jpFro+yirp&(kq* znZzb$gW)A8PUHUmiueOAi`+5aUKfNfbn^y0{f?X|;V{Rv zDgaFt*AYj~pf4J*28=1gA17S7LEP`xPQ$)R|EDGO<57tv}!P67IRE>?F7U!k1wU zeECau&r1JWz~lc|Su0kC-*SFo{Im9va-8HJvQ~e{L!#RzBJ8VrR}o-GN={Yod~r?n4)stdqhy9L81Y6Tk6xgzB%4+Tcrw=~r(-U2OS+7=>t@Gr%N)$xB#>yc6YOhXu zLU+#r65=(_rQ0f^nH|(Bh6R>FNqI4+YFXnC^E?U1&gUiSh24a>VS@*ax-+w)Tf=Ei zV`CZVv7d#4-W!O#J`_J=N;~jCqOI}%5+xSa-%`G1Wc-t++Q0gQ{-K>0l;BGrnBWWl zmMeqLpR`n!qZ8WbdA+WxAO*xDMxXXvpg!tww-yslz_*%?MtmPdy?DI>L~N%G)Yo;q zS@~%lU;Kx4Jm9BwJl4Vw1?W%fc+Jo%HomkV&d!2^n`=*s)rWt23^FnOyT_mpFrYQY z--PM6IujGepWHR26*xY}D9qUdly?u)9-+MFv@s*4^T#$=PP`>mKM0-g97nMf2i0;Y zX<`p8J|{O&uGuZtrD9bD@pNwopCegU+9Q~18KA}_UrVzVS5r#6mPPvt2*kZB3>Ty+ zA+IE@E@@TCy?9;j55Q0$O-atp8d54`tI6mUvXf(c;h6##>VY;;U*|&d(b1F_X{whL z!35f~F%qSdM(hkBgig7m!WN-Y>x#+LG-zwVb2F6dUMFZ3+SvMx~yEg1n|1j zfng`atr(cxLIV5^KY&H?ZIly!a&!S24Wz&RO;i5Xbo(E>T(JC}Jscy` zzs+ltf2dssUb%g;Q2e}vjL{6HF=P)5!q5oe zIvavPZ7+GW;MGdNz;Nk$~9Fh8S`^NH7hm5vhGoPC-{WvcR6m#T{1pKOrigYEs zW*2a|^&li8lj7<32MpXn3rFIJVIksiiR3~Z1;cU`5&~U%bQ0-q=aG`J$7P=E^E!G# zzE;QBwR z9k~!NtZ_9vOK=sHVvXPCK76kGD<0<_x)=R+y*e{ zYPbQPdho@t`76;~VSQi0wH20}`W=6+#|2N7G#Y5KePfrY(1Pk>l_Dcc-tPm8`GJ%! zfz&rYZNk94bADyW#x4XqQ+h)0OoqWjf>J6HETS_pTs@-lb@XVW;2S03G}j*f!lqMqk0i1A7Codx_qf0K4l`~k&MV64 z*APDtOg(I8_yQh=o{}+p`P#-nP$0<&ZLC89C#9-h_ZrhUUOT4D3n??t$OIjlb^TO{ zBx=*>6+Y~C%at71)Nr7o;V;Iwn^5^Xnaj%O0IBJ(WbX|FV_VU5)~O)`e{Bu+-x8)} z{IlcbADfVWwK!&C29 zCQO_Y@p)IY_S_~?AH2*lk&=`IJ$r$8HC0C`q#wHFcG|&u%O&z%@=pz5K}E;T#@VeM zoCFaC>#t;G684fnKcu9E*pr}9qQzxwmCu>UV# zz}SClFU9g_qY7mu@hBVynD*r__kLj1qjBd?N(dABw;vW_9E&F$Fk#oG#KMhH42Iv! zJCc&maq6VJPa0_slpRL0%Y$)$di~JwZ6&>V(LR}9%uJpfq{)I!;ROjwx;Ou+d# z-At~2Ua&|p^WD4#&ho7uhlM?)fcfU?{`^g>|N9`8HJ{$pGl(aD-D?-~9ym9kgLj@{ z*~c3o52u-LGBMRN$Rb5XdOVLt`YW={&aWO9uFO0?eaG)Fr&nI3xDAzjxW%s1f-(Ff zw(3-<5uk|@vug@uVA2e`UYJ8Ev?OKie3tI`hfSI_dj%^624-}s0NELtm0MVf*F3dr zJrFD0@etkBYYPTs=K?=I#T!?1etIdB=zUQ_ri9E3vPYO9NzNo%Fy(t#!`NM5Lu>by z^*#9lo70JaP07>-t!T`UUWCO1?K`Bn)}J*8TihH!^5gSQ(!oqv?ChNTnPzi4Tp_OXUtZjeX%k zV`0br4v-5A)l{w$-pYYJQEv(}xSl5?deYpY^z!t8UVe4t{x`GAZ>2U&9Dj0DRgRa8 z>nHfMUEmF(-JzNR?{#BjNfbVOUq1m`uSI8|n=$`tu&fY?_{ulMYRsB+TL(;b74vjqPQD_Lst$oWb5>8OquzZQG&6!=9O$*3XB+XSlEpc=b zS!I$4F8o6EPVl&ksoTz}6_j;L8h*ria3u$*F*+Rc>fsRNYStQQ=8R(8<7Qb$(_s$| zQw$pa`K(&{U|{#j)7qW|u7I|3=zvxe6~nPAv{T{STF#xRCE=iLu}4ej+)BW!hQRVA z73-C__5{JxTy06Nls_4AJ_A+wP0yhll=aBdas8q(ycUqpOkLVITSJO4>P0FSQP1}R zjJnd>K=#fw!3DQmc0pyCpiySIfuEcmw99D<`38X_22nFJC>&9&AocE5k1khc$9FP8aO5vC zMZWgDpwX68?3erWdV9imuk)ETw{HBkEjfM*!SRFcUGK=IbUjm@T1GTAI)9Pwd?5w`$ubM!vWC<+hb8bL;&&l=L!M)xk3=z zar-%uS(lv~&k2nDbA>Rw7Ni7t&f4I(g=#lB^VooX9z$E5g=n94NOo)vypBXx2$Wc0 zQNx*&X2aFF49u)3zDg3!W@ z`J@U&Mg{MCF=Y;ek*nBxba(58c0gL)ZQH8mUf519*y|5alP*|mc8x;4HTV`-k#rl= z?+6r55hCMc2787%*WeN-*t~2~XE1@b=t_P1ahZCpB>R&xS7BmkF{CgxtuXMM1u)^b z2Xzv%R4+Lmb3qkS=_j1@Rd10l-T{ee4z)X~seq?A`bE2V=)%TpAHoKs=TSX9X! ziI9x`iE4nwqiYH~@b`dH-X^aIwFd9J&K~a?hOr(n&DnL8h@VI6FbuX~!&~vtYptQz+FF zM#Xtvx~Vo4i16(op_h(2>}@KpF)>)Xp`Kwx+-$-f&&8~w{t1hAjCvt{1GAGihvN%n z0Q_;h*F8(O9((9FS+=!htUKsSx!r72^2#%Kh*>RO6&e z_ZaZ%!JVi#{WHDXE{?WzD+r@fY*YEeJ)y`Z=jOzvoLi}ON*(wd=o{1G3!QA1jdF~Jnm z2LkGY1mUteo#y&`dcqmS?F8a>Q^&J>ju1>z3qA=-~nJqeVDd||InN-KE`-+gdH9c5*8 z70NIINDOfeMi8Jm=9?F=;>dK}skQAdOK-g_$FX(TB1+KjGwS*Q{Lvr4qKPfGuQ?^| zf{h+PW}W=n?C~yR>?6W!0r*LcZ)eDIB~J)a=Byy;{Wc-0iI3dzWa%MmS_Epu`*BF{ zS$TKH*lcQ4iROs+K52k518GcM*Rv~|{&0gc z+YCdit3_MaFJxz@pY8%CC{}VV6Vm<|wPKtY5EybWt^|kV?3{vjeF{RxV!f%plncQr zZL+*v3F*1emmxWW5(-7&4Y(gjX!@Eg*QYJjeS8sLRQ);^gX!-YknKi#wJ3Bb98q7% zo68Uq!WjlisHawDWlv8)te#zd0qDgJ{?$*9h4nXA(0?l%{dYM${<9oT$wMe9O(n@& zQ2CE?IPQOy!_oh{9ImsToTLTvJhkPBp>J!5Y0_OIaBSyD5=CA!H6We1Da8qqx?`P5 zEJFjULjg*_7sn;4qyJ>-741Q|y+Xu=rT^q~5qFt{&}AnWCKuWU7B19wQq*6bg<#kV zS1H{Uen!aP6FSX8kP*iF-o&uAhtnXi#GEImtQ=sT_K$M-XNuKofmX&*d@%pRo_6)( zk2F_~yS~LD-3SedVpK}utGkXU|0(N%h|MCDQU}Ionp_3tC zpr@x(a+(l^GhN2Ld8H3 zBLIt|K*RZQV?zt__o@Nw*i=={(1y#~?Dt39pCb00YS`XLBJ$(L;Mbxmy;YG zKKkp>y}5O3Q-FZ}`t@LWGNkY?KM*l=`rCWYo0N!HBIa5^hPUW3)sio2agYM^Rt!OUGE< zt#Tr)tBSGQKfSIjUV)Y3E@8DKL(VXfZGL`)N-{|u^(=vOk=H0mIcdBC%4Libb&c^X zv3AT-u2J3)b1r(Ngg-$Y`XsReLm6OJ?-@mhW5AIzAdUZ1uO(9l!2gHp^Ax$2TvIp4t_HuX?23e;!p& z9!$EoyFHxlePeuex?P{VD1I0oePvmx=1r6BmGMpuNd0x|bMNy3#P$4uzBBp*#ko0~ z?WsGpTj!VE-Tc{L^;tJrHJ@dbi)y8M=^mcgiqrJ=B z=T0A(wX`v>?j>flyNdVxy~Cs2CE#6Q^1{RWl-T^&e68KG?*8ee?4@pPu}s z`bkzK`3K*oZi+@UOB?4G5d^kO=omX?GeE;%n33e9W=yAaG;35aRH(uEA*f)7X3y{x zFm{bE{!$oUbyGq}?`OGxy&Ath@4r0ild;~|N=>+7F>6!%&J}ot&ll?4l``)GBotk0 zW(08{42v?g@SgH^<7C`SC)`)UXom!_l25Fkrl_4_M7^D0V3+8O78sdhlPY@MgA89G zo6lwCS>->_(;=ga_{NmYAwk?R+UfHkNGPWP>Mun@!|=O$2YALc29;u;j+c)Yl`r|I zXEb_I1UCWU&5`sylJDet&kC?_kmRXUbv@}DY_^4hleaG}&1(6^pGZhb?ie<#aca2k z7&d>tVC`6X*)@Fq$MM_F+>3o#UmlHB#~K0R8nU!%vN9OHdNZmE4kqps1$(ZFEj#97 z6ft`=QoIeXrFx?^5=oqDK!=teiRArKD7~23r>vnkMn=PUa86g)(het;py}KxO;URC zA#*A)D+hTEs9@=y2~CKWxAto?y<~L77f6;TKkj)(8(FB)$=AJV&FNDzfEXHIvpnTZ z+b8-USVg`Ui8hD!Jm?@-jamRfr$2fVQF{88$MHcmTi6Hr7)&GjInd`!AgWFaL{l%7@k!(_NE5F{VaO^WZ_7W`p zC4k%-m80oujUV>vv_BRF16A8EVU z3kPtxQXz-!W0ycTM323Ub=ulO?wM^)uq{p-+;pT8+9_S5x; z@?|ItBe_Ckys4{@t|N}!udZ#fSFdjA$NX($p-Y#W|+ig$1-`R7ROBdKM-unH>>6BEu?g_3_<>%{x4=3^(VyoBn>2R35x@ z>iP$_fN^OaH9o8r5l%^k_lsi|xn>A12wvzlciDUpGN(393#m=T=21{G*G?MI2;Zhe z^j$G<@{9K-^ZrEh{3*U0dfx5_xUiHO^z8DrV+y^*qbN2IHMdJwCg3t|mku`m(NGIX z?^C}xlYpcm{=-tpB4^RJ!lW7y;vaZ-0n54CJjLF0d{*T*mZdiZq7xVcU{a6{8d%lo zs1Lv9X0h);XJo<0r4D%5$fBl480UjITNw1y=6_Pg*vpSAWe4d z+q#NW^^wcG2x^RlNz?jlJ&}Jw! ztb|{`cfeI!u3KQ}DI%rvvy#PEeHVQ^6D=8xppMV2&^>Mc)NbrpGK*U#4iFP^J^@EA7keOYMv83+?mmbM3S3GwsvuQ|(o|LN|xm z2i{i5j}yuh(z~!A(ZXvm$d4;~*-WQ&X&m|{hlUoT9b;%Vy!kXrUU^ISvLnCM_s`n^dYn4?~ z!+^2v4bvcc{IUI=K)B)J>SNp`7D{;`HG+zY&=%1z!?B?QKE7d%MG!F!_o~Cy{EF?Q7liI+wt^tCiBwb?n$~_>WRgp~x#fl9g<2`iO zx!@GQ1Aio6M8J+$f=?N1|5Y;8`D6n7p{;dmM zhA0umONK-ICHQ1kR?z(8t3kOY7eZRh?^My{g}`miZZzopiHp#xcqMfnh#EO#x56DD zWtO@m?$c_CX#A`1K`1bCO}>PvySEP76y_(f>D+5^8FnnXrcrA}G&o8p=EZOtew}I8 z&E=L})zW;i`JjV}wB}EZRU_A90anS=j}W!F-*`Ge?AG6s+CZHm<4(+0PMnx6>NV{n zD&NqikKGHX&(v&yZC&?_0j-RN=ZR_Wzl$mJIXbW}CR&SvjjzizXh6_E;f3jB&!b6k zb$%;z8w|NoFY_7n{2p_Gi+=7F66eMWntKCrB1X(3MMZ>5NP8NA5`sZ3hXsc_>ssO> zwOthTm~h@aWexWTv$-^#xzebOTW2GJ$R#!+7!JD=(BG;FpUJt_SEs9F_YzZ9|J@X4 zW=nkl!qEq9R!UKBrH&cAjW663jZ(@|UJz(ZN8x*kOQ^CLTmnxa0ws`3o4E*7a(dsczuT@URnpa=H3@9txT$~*Q;E8(Wx zHaz8C3A}4zLpZwXb*u(cO$erNVI0V0uQMPC4l_JW8pf=K+b3LjIAdzdo8wbtU5GB? znrIJ3v*X=C!mb}61f+`Fs=eiOr1jI9Tj+ss>Q`;_O?qy$U|-i#fHwxF+WIt}T>VFv z*H<{;EDU@C#f$nOFQBADD=4Q-i{c>kf{MOI0e)d7&4k@|SWEiHJ|@IE))7hnhi~qg zXM*(!H_heZw+(ulq4@1*uGFxGvI+6U$MrI&mE(yN>@6A~x!}!fYec_uj@9}o{xwmf zZO2{~=O$f}06BbC-}6?yfU>4!PN{5ZXANO3z;w$fp({UWu!w=uB$;n?zc$2Q-Hti$ zmzep^YqLYj7C1*Ji&um1Pl+~b0TQMj zmwP>*ivk&C>i&EDQZ4Zc3wQ*_g#4X5opn<_x{L0KBzb<-B{e1^TrnWVFy*$`=VBWs zJbb(i=aC^RA#~5>Id(V7;3Tb$>%b^-Y>w9(93j)DVMaMAmB|2T*$U`V77)1PV_JD5 zov4yoRJ;`jVF47V+QIXRvU&%>x!!ED1!4In?*qB;^G)@v`lWT z^j3?2En4$-6wB#uWk}~len*-!if31+*JD}YP-p8~n0sm2*ur}42ale?WJS0`@z}j* z_W+G2MK(uB`n;aI+wjO^-Zh>+TN+sKyky6^GN%7yIe? zvJyt#%R|h=qd;cW-XOiTFjvf`1`HQC!jRl#a7ygtL^CZQAIT!z5>;F!(U^mre@tgq}iyXC-AR$1IWoh`qPtUnXwmlr;^&$7UW$E&`Bhg0WU^{<|ftY2NL zI-3{PAJ5e%A?ZFg?;iHg&!6-UYhJ4=7d@R$ceQou_e3?@=vfNNRIQKavmkGw^6=M< zo2BC%Fxsb0rB`EchHJyF_p_tP#m8w}b`yo_iyct+ve+OiJ^lbqct{)T~0Fd~w>;mCY$&AdB6 zfzpzZrEGW_b6rGMo51*wpbzD^OQ@Oo!}B1yIuk+ZCfdV%tM5Xx=k8xAWzh$w1YEg6 z_yEkdn-dcqZ^1m6Uo|CR`))I$O9K&>_9a%b>;90 z9*~x0gR9{Y(`8zpo{%~|NQ!f2O!fi3G}MnK9r?bC0Ytu>=RSV{XOb&|`gng)1(u zUT7GbYr!aYXHq%4C0Lj9X3rEQV_1JRb%$`XS5VrT?tSc-3^5|_=`>Q-XM3<2Tw9&lQOlUSk3vXscn z{%Qwr_GD%O{0`Zp?b^}6TmqM+Nbm79O#@+c2G)Cu;MOrFU6hkf!I^uj{%~W-m|#-J z#mlBSJOi%cDJ5;bS4UhGybNdE4-L;UsA!52^c7`xp)pfvS-&7IVZ1F(*CK-v-v1f( zEZ=G+K0pZH$yEZ^3r2xri-u+vXmu9*HAKv#_RO+mxL!nBH1b^0sr-@x0P{54PB>d}*OF1D2JiQh+&IK^v&ar@ZSYaZ zzs50u4nxiff2h4OYOp>FK(dBB={d~INQQsA^||(k>HIoS=ByW)l8nLd@=Ltoun<-C z%@W@NTv6;(w*IIb{Q+SFZhRa;Xi=IEq$L2;%8zIgfN4z-kr#|<4QLPnF#ljqs+*&Y z6^4^U#2v@-X7=m^9tfbAn%z;;oQl;V{A&i!l811|0a;D!?Bcf=Ip|`w{;F87TX8*| zD*lNU%+;@J;@W@|7C5@_yP626%Kn}_7TiLKHN&HyMd`_hOE{#Iz3Oy$Rf`Lwx3sU` zn50AId1x!1H@)qn=?|4MAXa_zKfN4O0r1OU{;j~Be2XlcgHx^PakclY?i(=bSeV4j z59252TjScaU$xI3Y;JF6otqP5e0R6gXD***a9Wq$A`Z}gk+|M#IXvK+37J*Q@U&R?O-)Ph>gzyYxLa4?evgcUaTiv>o- zt`>qe!=XR$TQU^hy)G5VjE_;TU>2nYNP4z_-W@VfK@Rd4X5UhGG2avD5#LfEiWpAY zAUJv+9H&lI<57S@E(GAh>{$LV^DZKA$S8ARK%|!io-1h;OG2mHFi51LkuXf8oRKh4 z_RR=f5|n^M{ue0_5))jpE*$>3dYpo3?t=GQJkKeS>rzUhWDI^(dDuH!H9_;^Bv5MU>o9Dhdg9vYz-L>L4k4R z7JVsr-v6;yz;pu4;b(}9&qi2A{j zg_dNy$LN*Mp^!x6KoVzup%l9Mq1nD!lp1-4OpkyqLm!CvutQmN`rx!M?e?@SOiW<6 zalnCRmfXCE)#cM*XK|MKK$`WDHEU2tYbs|S=q4Y4T-|b1 zx;xa6&3XFj+0sAiFYrsT-ov6^BdnU_<_DfEvII|F%+L9{WisBEZ2$m(kB>)NjFG=Q zKxAS2EzsFtSV#X2RI-K-AAMAc>4`HU47p4ydIJ<8FP({CWC;27S_Z3mEU^2$Rcw=B z<#IA29Ak4X9gQd=nq+tL1v?OsTr`jO6Q^|fiBnqo#3?^NTz$HqfE;*ZOf?up)P@a-K5Uz495Rr}+Q zr>sbSJY~(5Q(p9K)4}#L{BYx9h&Yt2mzzFH@GM=I9K9?~9gF8VO-bZnq1;b~dbSh& z`7?J%sOa_u5aP<3=5M0(zZ}BK_CG%+mNK$7aWo}hWcf2|Do#9VfB;7LDWeaa0uo-2 zUAFO41!>!79Zyiu9r1+JTV$JE%_0b@ve&{kgc8`W4<5}Nf-ViDJ9Gmhib!Q+HfY~D z`gRgszII3sM^^K?&IM*yvtia;3Z`(B59ZardME-*f(&w^gwV1juV_^^Xex>J7{_B^xVP!)--SBTAE73^m4D><|ZHhzDw^0mK!L|lElJCT9 zhp0q6b~+E~BjEQQY6Nah`@!{&morb#ls;K>p#y)@34V*%@Sh7-WBV-*0Si0Rzrq3j z8?4s#308Yq;gkgrXdY?*a29hTllB85q}D_dFP-zS={zw#Vzk0sEo!9WDB2krSo?q# zopQ#deTO6kcnV^R5J-6b%9T--U88UTZ8K8WLVrj;!L;>uHs zw?v=OC6^&+nsOSL3Z&yP2)tnw1gAHqn>BU?o2BtX>ZhB z2q|TD{W$(y1>4aKG8Mv-E7@K!$U*j%965O5a)#wPv)#Kjc-$zTgovFR*QlOo*8crj zqCp%|^d7Jo;8M1suCU4K= zU@CoVwQu0d9Tb@;D9zpK*<(YnNvt9~Munc*_1X*=c0(0D!ut5LxcSDI*8z^Bz!-hD zReEHU+&X(hiOD^R?wD0j#wz`mT!-;mE_g%XYK=)=z)qZ00hrp(o-L4Z>*6gPk_EZhHbgdf{)A^ez_|FrIWQpK%-8DNC|fV9*58hLqTp$Ma&yfu?% z7JN#yuIFX3|G`5IjVbpUn@ZBT%_VjkMQuFrSf~o=h%QSS?=So|W`u&ATwb&xa=521 zk#>tZuu&p)^ke*rw`=I}jggNr-!7}m+o-2ei4F|@N!fo?$= zqLn9cjt7}-r2h(rs3BV>CPIFwS>r^~3UNy^ESB{%H%G)@4Y93M?bC9^H{93VbwdPn zjk*h}HptLcJX<=R1{)Lxrra4c3L6keP9q#Zk_u8eq6K|&wyG8=IlrQrPvz)wi>PYh z=qDgPUoh3*jKbf;*fIZ!swW&PY5mD6`)nRiI=!Ac?XJk}zUJrfY@`Hh`nhDA0{%)_VvixedbzoqB0oXzvmv+V;9&q#YW zt}UalXI+nqD&;@4k-m|YZlpy-&^`IF9Sc95i8Kf{e?%0HO5(KVYxL8c;QgFpIdM14|#1RX%?(a z;cTx+x0gQOgXnUq7;zg5XGuJD=>#cjQ*bHlI7dB?<#{Ko+!62HcTvDMOt*HR=KD8c z`z?khBh#OH^}o`;rl`S~oYxc(atlD}j^U+W0Yq#R^z-Zu(A-|JOi~2V!$KUo#&2%h zyv#Z!d-y0);E-XaH2XNH4H4XNGEGDQmr@;-f3U_!MVPc`9tA3%h4d7F>}0QIB7X|B zH02KS>|YtiX5i~TX}hSqNJf}s%#fF)DCpUZ#OpYD&LacSt>iYYx|s189@5=3ih#)9 z-^>kxggY#NiN7MIR#1V~nV|^Te7Nli-UmF-4jk-LlH*@qWue43j@Zm*eBG@Iwd#8u z*JPxvQI zvug}LvS5_&YbR>TQqgDq1I$^8&5aD?>qF)e)zEi1_*V+>ULdXDU;#*gP}+T2UwRsX zYp-*qcvs{Z?I)PCnuTCN_{zqrfsGx!Fg5`@Hnc2`fEN9q6ky^%D8Le<1`@nH+1R6B z9Y(JDYbiH)V#yD5dCN|MC>p8CDV*#P&#r4L|428ULEGnSv;QVuztzG1b9b5?zqM2T zx7GcV0$laUWD-8A*s~^x^U+h2EjxuhelMO5Cb>9=NH@^cBLd2G!O?*YfIM`y+nr)h zfz6Jr#59(#r$d692TTkW3hLqEr`n|!#4CZ4hn&PfkhG1?tNdn=5+NrSa#F}6S$UCF zBiFe_u_@2PIS8iFxkIgEv`_7w%p+2z&1oSR*%gFo<~=`o+dN%p@$~|Ss;~p?Bmp;5 zuppM?5N14w(B?~R{}(HENsBJKBxBW9_3w9?tgaGhm!1}v@P|+q*=J0=;)ly^@L$u8 zhNRPW@9yx_f}dOFUTHs4_qD(MO*8-2hMbY(PwWxxIO(_n0*IieEPrUn#9xqEWfzEWvHzisew1iZqT>D_>8GDc%a z*CPQXCXV{T;hAXcguz6M;O`WOUa7cIAXpqBeQg>Qt1{;`5Cpi2JI<{iCFae!wcf6t zeO>pkF)Px5(1ITJvkzsX2INYliKGn*FDRHWwDc0g|7~tacyY0MAV8eLY>x3RYM_B0 zl+7@#kMZ0u3j^fdnd@?&SLvko55&BX&r_eAESTb}vzYsupz8qWPfivy ztXjsLbTwzk38(cW4=j`u}_l|LY+}rHlr2gN^a8Q620Y|LSB}#St4}aJQ}}EZw)RNA0URN(YJC&V-sNmM(u; z4K&Gv3#~8=$;s7*A{`56?<>mhDKO92K|Mbw;Br5nBlG6@-R39>ujYs&CTt-#D*(gl^NJ;&LVd&{R=vsle zM3avAv@p4h$;ZG_w!`VsBVY6y96;5bfs2+N=9$t}L*9TYvC??Qu!(qV4-&-}RNHQ* zlovMl?<+gF2l!p2#TyHHqIb7e76;w=+oqwuK&E+*JrjI`8T2Q*Wlv+zd{js z8IQ$x5KPDsN$`@;o;!j1rqL>K<2Qf*yORN#Cf?(nMUp#XSX)Em|8`4;Yjwv!`!74| zXuOE3rxq7US7~T|4kFPa5nX>E(VEl3rm8%2&9~rr@(tk4ucXetJ#1t-Q38TL3Pn(0 zg`$YRDHNp?U`X6%HlntKbOOH;mlc5pXt{F6W#&Z9m5nLw}qNFcZcTeg2=rT@2U zHa5n;RI`0$`!9_*s^Fram+?;<@+StuANq=1@_;P3yVn)O{FX>{cc$QNd(u%EnfYQ9 zxfDK1ZttON`dMSj7i%X(E+l1N5ZZ5y)kTWLt|tiQ(y^0R7foXPCUH?dbGo%19I`Tn z;nHrdE%hfZ@w}O%5J6cp3rjpm3jyYIS~VnLBQo`i5g%P|{0;HIDHa;Pp_Tj)!$lddT)41bg6rC)isc zpyF&P|Badc5@P(n7x8lZB`C+t^k1O`nCSRt(tHzm4h4ZLY0bR54Ht9rp!A3rLWE%c zi!c6=7Ly&MRJxRYK5p7Mb)L{KHhiXArA$umk-9%=pRcNMwTXR78ShumjiPjhp$x0Bbm5bBiYI-tm(92E(e4I0L$PL;fMH4&!Y^ROjo-iKn#rNsx;(_hgJ+Rf%WF14eWoB+~b zFst?8CqAKyqlZtIlJuK@fMH6PieOue{;u_@T&~>oY!>BAGR;2k-MmwLEL!@RA7FMe zT4E{VsA#QEAXKN+;?iN50gdUKSGI?NA(T1`r{1Rl1Z~DSyG7HWIo)bh0zVqH_JJ$T zA*-jGD*63ZdHK1Gvs z%8M5Hp79j00NCAiZs*H9Bhncb3fad^HqS`|>}$&dsbJT910nHmgl&Y7>0=aqza-V+ z$~%(LAZqbt{GkNky+L~9k$gL}npMTtvxDK)nONSj&Rfn#7^ZJIWTi_uWa3ybFcURu zAegD>J8N8YKmR63YdOOUKT5??HmR}{Ar_6KvLPLI`_D(8{QD_UUMc+UEAqQGG$;|= zohv%s^v^7P$1Zr0PwOR{hC{Es4CXCddj0zY)es1paMVEZI;OYx^nH46I}mPqX)c{t zLE0_KYM_lIv$bO@BI9KQd%nex4DhyG@!U=&F3PVX%oP5{2RI7kC*rhlVI5&bts3W~oeQv5L! zbZe#bA4LlLUYNg|3Gwe{`mc%<6@Sch|Hn*@f6Nr}$4rMFHXmbN_H0D>lkCQX(vRYJ zc=^(#{uhcAA5v{G|Badc68ibScp>^r7@g(oe_4oBV+Cur{)n@J)z|Ffe<5dGJr@^u zf=PvRTVu}{RXqi10ss1Xa@m%lWD=8NN!o{8ao4r%yKE-*4z@?@t|fkpmW#zLK`V!p zWYP@$F>28>X`jey0ULmDHecU`zW8qu?GK576k$}VczcdY6vdTNDbL?5s)mUBLMAL9 zF5%lhlMpe(n?V?TZ3(&tK7P%^Pfl-%P<;)#4Q!qH?Dd;%=k7esdg$AHKYEB+l%2KL z>C|OT^BN|5!ZK4V1MN+2d3ZSU$$mmHFfqjwR0(4W8O!Crca$v>RV|^ zBTvxq1?SFv)FbA?AMXfL11`Scix=uf#73x+mu&YL=hA87sx)mea-LXgQpIX?>^=7E z$7#J zzSpcpd?sNqBH*ZxTG@PqCTYk=(g`-%r>IC(`n-vn8RqiZ6{lqkQwPj6;KtpT6aK&^ zM|xfYYw0W`Cn5Y9$c3Xj22}H&Up&XocEFur3r{k>itz1%p;I|o<7toQ9=C*N=7n`F5F%H-xfpFD?dAz97Jju zjD%eD%3RJ{;S38;QCZs>@I1?H85weu zAT`?B8_b`lYTI_giJ5h$q=#1iM()G}X`c`PDszoDcZ3q`v2|?=E%^yP3z?rbUb}9r z#l(tV&A9$GtCmzNB>qIlbcXx-yhYefMXlD#{rBg#sGrXhe40k=c?)w@9rh((`_Jvl z9#Ni&wa+=7mN9ML`|(=@F0XVJHCGYo-%zEM^&qnZW8;JYXI#GRXyoT|7xqB*KJi^Y z(gnq1L9H5mk(*%mp=Xh5`2ADb9F$r5biL(L&=gc9MNI-Z-gqu-XCCZ44yQnNS z2#@h@Ap0I2raUq;3(iI-Kmc(Mfvb6oc(GyeQtE-aI?d=M3fA=VSEd;vFJ0y; zeYej^MiJ!uzJhDX$_70@^*>z0MFn?4?|C%LJxr&P#`ft$dgok=e)SD;FtNPPd9HT- zhL)E&KCE!_6`nh0q#(vgItzyd&1z|Di}Vfu?Y&>-Z-RdlLVs!X{J(ZtU}E`80GWl2 z>A!HzC%T${ZWQy$)SsGoze=ph^IouP6yIl9*zo;OY4#%GhapK^sKE(&^vVib#9-!D z8+W?OxWU>DwOC+_JG`eFGAL8>_eQ1ZZSI00BKb#d?|Y~FJ3%RK?Z;e-TSY27)4V%W z%EALw8Gdiq`w@Zyf(xvq{IAtJ*P*=k@$it}ASY+r()Q0XJ2R$(GkrMP9P@wKy*Y^jUkJkKbN|q};p6qT_U4nZ&d0~Yr*%cRE_=2vTlm!4n<`$s8Zg%Oh7W~X zFYjMZxO)9MvsvEe$=?1pu(=r(I*X~q4fhP;*W~-wcuM^ z*Ls+l?4p|3l7)yNQoM2;bUB?PLXXjR3vPC^)GE!_*h)yE%GDc1Ir$jw zLJP}NE_=;3h{x=N(HDA>=I2Jra^&(fhSIakF{Mt{9HmAjlfXx|f5#&UO@$!G*z~SG zn|+V%KP{A_!kiXFd2_5dETw+=RQ~S9x(pdD%Qk}ah4BCn6>&+T5RX2sgMPcZsI*kk zk(yNZ;ebYjwwBgkD3nkbORiVc@)r?@I(8k(ZEYi^dr_4^1f~8a3p8);r2;|z32uf$ z>3r^^rNq~IX);Q1nnvGH7_fbiMrfR(p+=>NtP<(8Dii+bn5=X7RVfPeHQqIPGmBNK zx{4Sgw;x)yh-gOo86gsO+r)#)?q{~dT9)fzzH+w8!E8>tFiLp9m5fW!_V|_Icn>uh z85O%BT9l?Zan_{w&&;hwkMh?H@f;vs;K;mKK$%{WmA@Q~`2-INy^jiU{ge+Ip?jAe zyN@c@jNaJ1FVTTavEzYEXSD%~ zTC?%cP0B0?K9*FZkb0HNLxZ=WP)nB$2{N1HENN!250jfeT6Gk@$W@$n?b+mud$+-y zsxUUrapTRLITcUz?!m?L@(QVw?Jmzv0_32jY|2rp7}e@Wi)Ryh(u+(GD}AcA1d}~G ztXumTu0cA$*z~@`*@RzlSHwND0G(PJGtngrl+K2}dcOqh4Ck zE~#7$CV9$>aB)>{DjE#f@dP(>fj${s$fHCzXS`7-vtc9?pOs7*0*2HK-ZiTNO^CIn zhGt78AKD#IE%mT!8@4+BCC~9hZ~Abq@EVoA$c1BY)`EWnH@u73QueFPIY$i7s?gfd zbmPt9&xyTCJ)L6(R|g}C*mV`{+af#Zn?rI){fAeC%W_xAp5ZZACz&43G3(fKQ}r=} zQy`MioGhyhi21kg-RipVI7^TO#mmQC_b1N-SFRuwY{zX3i`l;A%im_XWRbAV!#r&d zr5`!h-mV;teP9kp$y2)LCCRc+c_P@SvKqCGr4ZwVTqO=ob@y%Tc?Xx}E2C3Nz3uob zPfOwN%0u!R@hGG@(RAb~=R_+Q;Fa;_?_sjOPWpjt%RrH?L2ARvfZ0cZanrv3xdxQf zpaMqKGELotD|%~Jv{J?w(QYFXdWDVqN|)=(#^`29kzIwZFYo%UseF21`mZm3kK)SH zP=5F}kHOCw_Nil*?{hKd7dvQ(G%C(?Mw{=Cx9?YyBkY&^3wLmJa-0_JCSjPD1BRM4 zxh!=2&T|Wb@m{C300#YVUX&=1DJ&@gSOzcKUdAK)0Y3#EKr4i$zc{?5l$2n@q@9l zO%Fj;lXELvNt+zC$0;jxij02^OWbo}swS;q3Q^*AoG1iM8-2*Waj1zW@KK*7+W*muTOoOK; zxA(Ia*!eYHVhR@cx$Mi~>9JQq$;~vM&9i?DFm2ZmA~VKN#xZUHwwS7ExEs%F4b&vD z;;_`dQRD4Wr~*cFliHHcRL2+z%CTuXo;S~3N2|Xyee5SDfXGE61`a{W4ACgu5=SPO zGp1rA(e7+wBf)>cX}-g!c?^I#6TWtk$@vf?+uuX%Ab-R_oeLWi?uYQJY!wGSkW|Wq z5!K9&@CYDu2dNT@bC3MXqY7a!R@i9e3o}aZy3AlwueG#%ZuR{;A}E+`b!85LSMOVI zTq8v2dkYwtdtq4EWlJhJ5rJPlNy|DRYOu&%36a(3Ql^LIwSZ~~Hu@6h}JG%ga%#1I5brC9SFq7 zLyD6-q=5y{OOX-I7&@$waS6=21CWqa$HQ|!Gn14=e04NhW9}^r{|Zq7VOTI8)NwBo zk8+hpExl_bb2y4q>XWpf#!HVc#{^2Hz-Vfriq-i>7Nbxs5tBpv9$GD4>kT)d#D(w8T|*Z9XRWBRHH&mI~U4 zezKT403OdVtM4ZYe%f~_3Kb*zv~Q3R=uWhsQF@i+c5)djpJ`+AY}*~q9xSm(=QiC(L7M&gpT&l@?Wf8!Z*#l63g z9r~~oUe7gN+n%Vw9kXAh6&S#o1urCYEA<$liJ+qDt`wYDEhaiU$(BaZj%7?`q)bV` z$PQe^@x7Pe?<&xs*K(-pXu{n!%Px-16ee+s zZqq5`pu^adP~;;QEu`A2&urQKnpDYJ(7nY03NqeuN;i?iT2v_tR>s)h*0Je$tK*BN*PuVj- z!NynvmyvkCIE9niU@3lvWC_TR|AqAfi>|}WG`V1R;B=$o$Ej->jE-o@Qd9uzugpb_ zsy>o@X+Fyyp4U{9gdNn$rgyrQh7P2oSR)zsABfA%ZFG*bRzOhc$t!JAwa zC^Dp6qJ*wr-0BMtuKJe0Yl<-mi=Nj!Zulzzn+tXjK9Ny;Zx7&&`Xe_=xeSQ#p`I>1 zC8-rz>}Lf>f;~*`GVi0=byq;P&um{Ci(xflLb6{5%+A&TgyW0Uh*013?q?Z|4e8lp znVNkSs9w+)9JVkwRW91EYE(5}hPTIZZ06v@hE@G(eVBD?CG^YvOad%U}l0R=~^t|m3+kH$tqj+kP=6`Y9eGj;i!V;|8g~wWPj53yj zkxtH0nooa0H{m0zBI?f*sO!sR+&?P<%HzhDWFX$V3BY~7hFkEr!hs9Xg{4t=1~ioT zlNk{~mj@**s|t8B2emX#h2*|ghb~FWB4`~4$DsA&a;cn52{rhLg zRDzgjb@&I#BbxP#y)8|t1G*zI!~QON>8HDJqR;~=Kh)6NzDFr1lYqT#$z8!3$mKBN z@uq8IfoM0g?d@n`RdmOZVmSDY8JWVK;?E)CQVo;IpDfy6$5D2eQai0l2{SLW)V`fS z4vsX0_kgwI>VB|FM@@ZKQ`%*{q|;z~)Yda3(r`z)d74LqvKI*I*kC8YH|#}l%if$L zoLh5&zS9=4`8i|jA6JFFqZm$_@zl{pZ@pv_7l(PGi4%dHYTFp)R{K85??=ZuqmhA> zxb%J=2TcC^Cn3e*@7ecaLQzHYlliB?f42le80VvFx0-rJy0 zE|%-t6x_r>BzWQB^U)wXi#sbem|HmwLm;@R6~!4)J@)g0xbkM^6}35$gr^oAam+0I zUlEr_#X5s8qStjhf_FssU$FRaSUcbg;+;@a2wY=H&}$MuE>SzDeQL1Wkd{FcOitno zKaR1d0_epI@4?#01!5Y2o<4A6t14UR9J)xq-y$|23AQUB7}IF5Vc~2lF2m+q-f#8q zOW5}u`W^mk2ya{HC1W;;QQem0)fO!3bhwt-x34 zdlyqaJv*$gF7PC()LeR+Tr!+3Nz-l0t*~^5b$t?Y$b@ESXREYS?e{}TfKJe1~=`$nNN); zf)+#X~dMa_pABnx_T_cb=BsD)n)+=w9T%NC7oaqU)-4zvRwmW7Dzdc(`yd`bl#_ZFLg?*ldg z?wV(Q9&wXxF+qs?W;=6taK)z)B^|40%Wo+!#jBI^on&fp3`eD}>aR!XWouy&hbG@k zMx@*65L-w}8iCd7-)t-{z0$WA@=7Bi=xA+TY#mgWPJ`g-P}tr) zcWL4ZZE1aaHGN%yC5#lCS5aWS@<|;V=6o<{QToR1n+vB|W(B+UOncVy0u9|$fdhM8 z0kz6n=f^gYwO41lyTCrDu`W6&{S04s@_GN_fL}*w8|^%`eCOLE%o80iDb{gcFeZiZbK)P;NSh?2AHKc)me`RH`5+OW&K1Mg;MuBhj^r;hdVtP6>ktd?w zwf>FZ>>;e?e-L6!%>Q!CO31>=QNhGP*v`h@&ep^hEI7&_Y-erfplokoWWpd~;$mTB zq9iWFAZB6hWa7XeW^LePB4T1>XKcbCVPaus?nKDO_D_LQCPr3PW(H+vL#IFTq>?rU zW+s1ED%Ai>m6{kiF{oP@gIm>@{#(z$NxEzp&QQxQLLuP3lPZS9|fD&5?=+BvKHQWcar6xnBm@#4;Hv)>Zk3RA&rb*@Qh@ zDWZvzP^?<^fV(aK_W6;!HPoT{TsD9^ae`P__FXJjHq+RYyLZ2v{{BN-yoX%8fmk zm|Lc3fz14dYQ9^=T(FNAS1+1Y9F?ephNJBpIQ?Pf%0m#Y$e)#SxIQWNc{G5A_>3_Z zKPp`O8MbL8sq{XU;%z7F?Uny5;%%b+?d9$CW#>%)`KUAf`Rb}>>eD!x>&+8$=P@Sd zlwnx{%-oyC#G^qQ=c%%i9r7Hc-HmqT9xxR)rn#>&Y49fjaL& z+fi>f>z!|CN3IWhmE%Jz{ME6jy-jTvGzsUo5doOCo8Nr4!gaN1VewuKhJ{yt>v*XF z8|ik(#SHdi{SQA)eLG|<)n(3!VBQtt)1h?}U&U63``Kd0rf1D&@OyHxeHVbSRi?dY z#khbkUdkS}*mUpEZ-Wo)o(JpbF^}hAe!`FUI|?q}9DQz8xWMVlbPhx)_Go%ut0tGJ zx#D>}6Y$CxnrYv-%kim~kKm-xbzDs4z>(P=U-ZPuFLD6eH4+6C-S;y1wEgYIcjmJm z^urZ@iip$PW_yrXrIr0=#USFQp|#D>9A=)%a}n0WcX2Gl8Br&(RlZF(6tyQVm1kZ5 z^_un~H*BZn?o`nk87S>iBoQFgl|cz%52a;1`|`MDoS%{U#Vq1T44{)jvSD6KIt7*e zCSEDttMd%VroyAx{Io*iX_t$piumqb7gLVv1;u=>=bKRi!{))>i*MTV42g|Mw&M`5 zmzB3XySrfp&PPSUG~bF(xWS%@r{gL-&Xo=!R$m9+~C3S-M z)UOrQ;^+jUP;E7`YgOOpk&a())B4*z2Q3i=ffK58kiPS~TFQB6~B+9PF( z#aUUPBjFQ9)lds&e2`r6z1s!gY`|(lL;Q6ZPvwI6rM#d%={h$4ceHa6gD1+r{Ojr$ zW+y$N_uG46ov(XCBm6}W&6WeY{e7}`yW63%P268bhX_(xG?AOPy3>5+)*@W6D9%#d z3fK3S!X%?GPJbmt@O`TQzQB(Yy^Glit`!dXw81x-|PF~ zxLUuVh^bi}Pdr`_i=FP>RqR&_u3V;Bph3nB)*Ru~R_{@NFym^{yu%4t8@YB1>`@3R zpzoPPJQT5<$*T7^C}$JQZk~;Id3Y!PR?>uCNi?E-@r;^bodC~%u@UB^U)jxLMr>HU z)@8Y|FC`jJlTs2E)BZ?~XvslvztG%tga<&5ynkphOvdgprn^u)}fNypjNt6 zLaQ~sN{<;F%^wD5u3{T{2@abNfdF-J#ZD@=1H`(;msIL#Y*q5BOW0$%0<`E5_BnGj zGNmUyT$OtDUn|<5TvoBea@1WV$${n2*&?nA^|WO^S58qdP2Kp+? z_EGRZV>uJ9tERfrEcurQP+%6#oY+5XUs_L z;HOhP;I54@l; z$;>21nsiW{3fUW$P0R5wD}x<}5xu7^RtJC9#9NxNO8pc9mgW|1pjoy0r-bajOk;~@ zldPwx)0gb$>wo=>^;qr(=-=m9Qwq(&;I`1yVb8Q zxu9mx2~WOx*~~nV0X0YY@Vj^)G#2jK!PHBB;9%{uee@Bfha`P3PWqy_b7A@pryFes z?ss}R2mJ9z={m^!jL+F=s1!27ADZ|xJc%#JRVywnRcn|L7^kU~xh!fkzeJSjzMUlOz*{8GzK>t2 zn7elViv0#MRgx~98;jOGTrz5p&WfTvi zfIjBw^LFE?HA9HbY4zmj)GSRlsIpBVEtMV6c{&KUYb0*|OYb~Q4@j4}jw^C$$pQdP zYhHb^5c}ae9JjpKXi?s5@05V%E`^pmz`fK>i%!d#lg<1&BNSKkbRUW)LwGhv?V>ty z4wpeWbz7qSn*M3ycvkqf6ZVEH`$p*R6zFV(*`jjrFS!_w!8)+VAUbz}N9sJ3TWFt2O3eS+c8 z-@HBU`}>?yE78FmY|D{$X`c6`2-u`Td%22%=_A~wip#hrR}~RCKFVdMh{L9&VPznS z>OL2S*iDA!DaK<4zLT4Wx&_0m!k#5gvnW5L?3oqwSzo$@J`p@N-FhQ z3l$|8zS3C=P^2iG?_rsYc2*Br_36AMa<)WguuBLzry)>mfZ1c#S^k-7jdq;$MF%RemVo3+NC!^bDJ?GExw-}ey`TQNwu7kc=NHQdapoV5D%R{ zEc2q4iUkuh2vldoG_-*iE!04@)!3mfb^D5_P9r>z*!%EpTckU!QONK|_3NLvw`>V9AGx*fV6&|D z*OGN|$X@ZYW(pufVN*0T971aSOz2C z(>*l$AWt8R8SGx)qrsvx=rdF3!w5QFYgQ97mN_`veg_>S2S=~r&^P&1gSJ}TJ*&So z9=t3MuF$DdE3sVuw6lJyPbpt6owZ1gW?!4dx>+ewgaxRyu>l@st6R8>ekGzUeYevy zOJmfMp%-lndII|UFCSg< z(A)+T+*A`wFO=o?)QdHO5`C60U z*f%3Od5m}vc3VUv*T`JvFxwLn`%W5V(VKlet&>N{m(N%b%_EZJ`S8)MQKz_XYNIA+ z$)()%dxYgQnST0q4dZuxFE*JL3F+!EcW@R8Mgtc9B;mXZ6zhi7G2UuOXhSquR4rXWs$VQ)ifdaO+{kPO zPucJ8_9v-cEVGA|WAx|Y|FSLoTH?TY=C+QJp<}MlAdqGx*InlZ|FHX9yFk+xnbZ5+ z{b#Izaq!`h{8L!Y9Y~<09XnQ7XYRyb@;i+X<1wOTLLl46SRL~xS#Yp4 zhNl<1VTVMv5^d4sBL)vc_1HnQXuGr(HEo<^U4B5s!ltz>L&BJqx0D;<_|`3zBE{uNC2F5qMYNyfXn#iYG)tt;P~|Oh zIl~QE5qpBQvh9+gg909~iwCzkHixX@G)bXkX6@_lK%NHbl<4n}7nu9QFXFcrBi%5S zDF$tq+>ePV_WgAF8{5$|a;yP#dF^ z%r8&z`69bZZ?#G*9R%3m9>@VDYesy{GZ%e<%%ubgw17(laB`WrRD!^;>hB)~g#WX& zi7k8BcV<9OG67R*=UE*tlaqAQx3&=KPkuE`yjd(!&}j3BUzpb==tW4dL{N^Fp5(yB zTGh$|y>D6*3A-r3rFNJ;{sFhBcc@=$Ky$6T*}22#IBP8e%%x=;&j;pACO4@9a>;RM z#~$;J1?J)-FrQ@SHtiJxowa`gpmx1HJl-Bbpc&w&);FgOi}$}ZmVN@xSd;c-Vla4N zbIo@j)jZ=o`jfA7x^fdXZhGhK)!07voN8Zdd?IM2L|A=^_`prwwJMu}xC{>E#*!t$ zuz3Y?3&y;`*DD8=_r?%T64o zfPpiR+Hg-}t;=;8Jl=#C_}ZY~@1L?RyR;di@{C7YwiY|RaEMr1WJI^a4}R-YRWHjj z);UN(hbR6Ur-XNyjN)wPNP)TbXnKTOzHSSY;9`5)8Eq6#!BJSE&f8_CuSFY1W-R6F z%~+tjLMIOgSTXc^YvmRrrns;J(CPE=>$vLqK*!6veuJN9nCa(B0#J<6jsUH~Q+B}f z0DO)flM*^Nbc?A}o9iP)yE~z^HcfVk*+6%bpVw7jZcQROLjpkd6x8}VVsPZ zajFg~n#E#><;aP!^uO37m%K4P7FBeF1@;xP`KtOC5iEO_!}o=SH*XI1+JSStoF_mvY_U-o7{ zNS!g0)>LeVRdU|}6gs1R647G9iyx8c<*e9hE`ht8Y{h@n|R(?86$Uw zI&P#rG+O7Q)VWKEY{ab@jUO;NNDBB?!HyJcQ|h)3dg$Oyqu0poeM`GdRs6zmW3BIg z{ca5RL2(uf=%1Vpd9_CZK4f-c8X+Tu91!|ssed5^FEzwvgI%NG&B&nhI@#me(o6Ni zdB{fMi!bSI9>|h6i7k~1=?IX)8-?QOD#l?O2R%gE&gAImaAg||zLp8woyMPt{>-(9 zpvH84;Y!Z8_U2G>h$q?MWkclNM;S@MO`&ZWF(I<2e<;OnC^+c&T>;ZuhKE?*LfvE) zSdUrM%y>W<#x-B_+N-D1*0sCt*3Xo+%akE__u{4sc{I7FiC(GEDKh7bA~Nw0YovY!{ zhXCN|3zq9yGp*SPO)T>0&F*H^llR4X9aU7<s$| zF{O#B5YA z{y9*l-J^?XyDm1NC*x7a!5BWE?PXeCe&9gf&ZvQtHmVvaYAf$@Vc_YcoYm794rYkz zAbSyV<|o-k3ncP10_)Fv#q12f0A-m@EWVY_yAEiG8gF&5<`sA21%&)I=jo-n-Bq{}T^x@l#?vN|kGO9g? ze|!GDUbrw(xlu1l?90W=E)OP2YPL5r+8>@vx=)_9Td&q$1~T<|K%H-|6^<>~=|wsi z#OVNJ83)0@o0Ti^g%gax^8=f`-~omja#ilP{6QN6G&&jYfmEJ{*&?59*)7Zl&M`QF zvlc6p+4ZGFz!`-YjsskPB{?Ve*&^^wM{VdVsj*aSd(A1EJjX zHy;i(qxO&seymLnV~1E^@o4f#UBxHz^{a+B=wz?4=^4OnGL*sziD#dy35 zglt-q8kV=xeGOR^uj0u1L0<`qGeXtpd{%lcSfz5%p75)2lIjuadW+bptsEf=^=ogK z`U2)z)2<0pMzu3~r&3?~YW}X)j>Mtc>sMX|T=6ycEVdGpKbYcK@!CGhjbB0cz(W3XRLpIV%Wo> zgtLJrZ@!P-%kfT$@GFl>NOIc^+HODsV3?9b-Zc$DgsR`jV+!Un<2qyi#AzH7ZPk_0 zajg&M`Ur*=BzDv-_=lP?yl^KCK#ZB6$6**ZgbvW*)EWGaTVo3s=Wd#s>O=@Er_0Il z>yYS@KKJoBHDa9(*x@~UNOM_9)@hy%s4Ymr9bcVQ8`9dqFnD34|c3-}C}spWUO zqKaj}_(G5s#@`&g^QeH8y&QDab;_=`7Z5O`W;G|VKH7xdOx6>Y@uZlG+L(4)SIhH` z`hjcg#$Gw|Cb2hZMosyintV7KgW&Q!b&cbhd7W1NNwMZE1cM{AU1e1qZwcSZscEbi zNGg@Um~1?Q1q^j^Lwm_@vhVkHKa|1?boQKgpl!d8I^+Z&E!{LnyRYBSA@p zVPQ4X1=oLP+FLxsp^bry1z7&bS#+4MxuT%O9m2AxCqZV5XVG61ed{?ai0)igtXpdEWvOCgf2~a|2(L8sjWB~p1AXG8+bUfmW2nRJ zk%4Z>#aWG+`+EZ1%dL99GaQ30C4Q zZQ|z*<9~Z_e!R*A73sf>*KbM*UcKAk_h}CY0hKI#?(VI~B}X(SeDIFO^gE0f(yutW zE9n+=~C0cj`riJ~);&lD-M5H#(vYl(K^ z-x9bKx8=RmuwC2ihTJZ>SyU5xltGh=2*4|K+lW;ER$%H&9yX{+XPO&n&4-OHS*rql z9qI+EV|$d2cZ=EXzQi&aQ*tbaAd2Q^?#&j_icrQ{W*S^mFkjHkC{tfNv^jM91Ks0_ z7~M{3HNQxcBJ9u~BNkTq<4(%$rGlSDM5bY-Q}mO^PM~2`oSJe7MXe)meotZd+%ZU) zt1AFE+XU3C^ko(PS*gdv`W`26I& z<>4L019L87uY@N&vm;K8uTTi^YyO9 zHUA8ENoAZ3^7XzxZmGS^BUaT_C{h*%c6j0Qb5*N zpuz<~=fSf(D{(c#Kb^K_RYiy;h~9Tn67P7~8G58g3ig_AiJR-PEW%};2ZmYwT3Hd) zP>=v7#voi;NwM1%ivsidP(uY83NR-VoybM5QREY$&&LHai_&aU-5$+BzHN*U9IH8rz1+!bv+uS{@U?q*yfmb@ zCh4R~I78>HlI6E0xY{m0nizccW5fJDRhO~uRqc3j@w`&5HI#e+kV}*A*4Z8TwcT_~hc{@eqI`f{mUnct**2Ud!8bfn4-G8f!hEpOu?%Mc zY=xggn#aMetN(Dd`Fa55j!`3>sXXM*#$)lC1(H);u-!kh05WvtXp2bT&A!XMSYxn} z!LyrF2I4uC(pVrrPBNy7ni#~u37<+BP)%ZBXw$V2CMJ!ymNo~6H8_Or?1;LD1Gv@d z-|ToTYYVAeJWp(7dJXx$l{;P>TyqvnEVt{GJ=rb; zhPzJW`fViH!|}PlA_}8y$K^{4K>XidUO}J6&=T8;=<`AR zuJn9qzE^Ahsm-R<3j9w-MIbOSs_OMp!wA!DOzZcywGe#ApWfMY+7{o@0i=1@z7<^Q zvF^Jlkgg%GsJkk%A>&4w+1s+vb#=t5cXi1E0r9J6{h0hBZ6wo!QQei7jseJQ#78pI zRpIoS+X?N9MIT;n5P>`hu(RN~N>G+nc_uUtecX1f1W>6@k$AAA<4p-fj3Y^R_{Fsn zD>cLDWtp(X5m0YbI%J;k6T&)1_B9#wPRRyM(`_y5NmeP|B?`PGF-Z~hm21lBh<}-u zGJR-Bu?(vVlZqw#U`7(8v`Ez0G8~+jY!*8RW>PSNR-=2Avgpc8Ob^}#+@iax)t)(M z?&ncqdLNDt{pRCI=rowl2uo0ZDaa$iPq zTLKxaq{m41bcaljq;Yeb@`+{|ox7T^mS^Bf773g78uZD+-!J_Wn2F#spbF<2N*4zK zx>DENTacAhGz`mSAq3m?+CGeZU6arg>GT%!WDgKGPJ;Yof)Fq3-*sLC6IeWfZ9QuT z73Mak=R!S33IGQ^HG&huJgsAh?F*NrbroNn3Dj_OIV4-*1qvCj?MDW%7SZUk;O1?> zP`NQkgcT)Z@wcWvrvnix@Tf9Jjo=Oh1fEguRF|AAj zs;Byi1XpDlIQPsl?FR>5YP;$kQ$fS|nj2u$pn%hg>0G`UNsI6c!qe$N70#!NM?j8!oljhkFJYt* zFjkUxfmP+g8oYtSaiYMIx1=oIAR+~1cDHzx5}p3&T~?D>FDKuT=k@YD2R@aMIV|Yy z(c*Rd66^Tjn2pPyo*6s&^nBdC7Zx^AjxpBx#;KS6vaQ9n7U{d==y1HUH-~<^OP#Ui zi=FBA#x_1%I1VhnxVZrD63s(;nd_%zXh`2Izb@+lt%N5_?*G5)&MK;|EnC+(1h)it zC&sQ!vs<;O{trR*cQ9l9G16{o`QQ^OA~k!uY52kQhp3auX{{o zHWEYFV<}D~9;E_z^_?(b+ic}*l-IHb=ay&42Kkn;N;$gM@CZ8!pIinT6)DI7z|JMV zIb{qpz%(!OqU=LqUb(U1ney0f4pNkoP&&J1y@G8h_*uq)K+0OW2Aov@p=Vk|+W}T}Jcf5q4@L5Xas*F&v#p|k-g&8gfrgVrO$2a9 zU{OM|-C%WYw}xx~O#*nIU89C*OwbSB1dh!Su|?UDWDjOn(Nxp|Ht5jfUBa3^*9xl2 zs|Xp#MH4$}RO!bJ{}7Mb(#N?*@@>q$`nnc>`8M+vlF*U@9s0MBY1Yhn@`5$*wXcO| zYDy6TB6<8Z{w+GzQ%sE{OG>+t_u+JPOljl-H3u0 zKHT_DXVqrvvt}^1MRs=2!EZQw0}@4+Ed1JRfH7`fcSiT{j#?vNn3ludv!Ic6_S+CS z6D6D@-9YVmfN<{C8f0xi<$y&QfN<7Zvr&I@mA>H%6E&NV^&uZJuybn43>;HGIblNh z&VjbNyK#XrPg1ZZT|49Pzz;m)JgRYWKb_pN9ul?l@|wRsSKO&MX{7rd{ z&W;Ga^N#mLJAv}v#pdih!BMGnajHhMc}&&)j9EW)b{z1eJ?@0BnU%9pt6*)J>Ed=L zV{fRs6mrSY%XRW*XGyv2{O4Kt*EQ9HvXQ_qgOHCmLET7e#m-Bzy7yghd$Kp5IF#12 zYs(GZ4H($qUS$->K=hTa2DnPHen&ZthIj2oUgEQDsUVVzX7F$Q@A6Fba%bPgK(;m zOst??Gw?GYZd#BFYWz9-HV;LOzrfp(p9l!K*|fHUCKNYoRhi}C0$IS@u=Eoixet85 zqtLK$x`F@FojtP;j~X8YqzYDnyT;SzW%KQ#*@_eROQiQiGACI8*^`jL(;#pKZeSB0 z_22u^`;g}fn%o?afAy<-o_>1Uv5kCNW!h0l3!3D4PG~YA@8d1%! zSDK466VZXX7|dsxs=e8smOxC1@CZx*R@>Emf@`mwJck2;v_kxYnV$7L zI1~H7VK&4gz=?p6wB$An{#V{Ybv!b6=m!nAGb0S?g&Z$aarB|q1P|b-YWnQ%+fWW@Ylyf!@yc=V1&n>z zxWU?mowA6r+KN#M@?3)73vH%f{Q#Gk8Mw_;=>|i{p z(babqU)kY1gpH~pRXssi$X^=m;<~0(AibZ0>0s+Ou~k>-3t6Im$7ahZ0k5fb32wRb z*=$1S$TQl+!gLj+zM*rr}w4BL+# zEv!7K}nfIoh!=!@2eN{{1tWjP5jj(31h*T76B@BRe5(%zT+6?kO>u_v(r z#QkOhaleOC9BUI}D^IxJ=%2tVwmo+b)YBN+vJ4a_z8tz8s~4+C|1#5((F8q3ySnXG>D z@0sl4uS|vn*Qmt4J^OH_!SidqDdHF>Mvhk@hfBbfi~wlX?dLpC|?nqqChfapxQcrSn6`{>)q z_gRu=L^XJHgx?)%bcm>HPLOlUm(JPW{2hIQu1Yp(H9|D_j6*N-k)SX3wT(~4#+)VX zmfa~)GpS70+le9g+loFJT)JA7F%w*^ZU2e*w<+ytietT;C=D+0oK&pyOkv-XQc%98 z7?Rhpz3Me296&hz4$&%6)e}`0pMEj`7YzNraWV|3!D_!i@H+=A;Cuv z(1-|kyZGFZk#p{zK8ihgWD@rSy#^xXsJ94WXdYtkJn&-QQ<}iRtL#M^9u@jCyCKYn z9+eA*f8gLX#n*|=Y9>OyN&O4TPyiCu3+*6IXyz_2#e1X!3bOn!Cp9pcu zU<=uTYhqq_1mm)I!;h}pXJG&zo(~gNtwbkQ#*4mPZt-#R+=QRUE5aKdWQFQ?=U{qP zh48;r!~Pe<@MN7Uf}iF7o!;t$`#<#7N+7*e`gzsxb==PwqWm+4wEe7x)9jz1dB;I$ zKxFs?iwf?T)`5ZgS)u*GO#h!FkC~nY{bOYNMF&MOTJ(wDDtyTaNsr8rODeWyD(kYk;H{46 z^rrZfm{%;#zw{Cj&!tVgx+N9t>v3p!P+Mr^>SE$d3CTzq(*mB!%!}Q?v{#g#Ewd_9 zXl&To$DOA43NrMXq%jo?CY z26g?6(7Ss!3fL+SD#w$oT4b0>VDzMlF#Z~;4+AM*gZ;95aodGusHj>K5RgH8==xwa z$0w#kO@uD7YW9OvSw9eVK<4R%NytS|!X?M*@h$5(xTr@Z5xM~ihDFxP`}(px8s$#( zY{=rogcB{KfgnLj6RdAiain11*^(nG-O1CAitoWaWFmi8H(+IY))wi%H?c51YbVSC z_;rgXFCL-J06%|=UiTh!&pM5w^GoQ!lXOuM#3Dq9WfXd6jybKW9-V!6^tiZNKLMT* z&RhIb9*6ZRr{JRaq@_#OtEg_923T6En4Oot4?F2K90B>76E-jRf}!fb`98LyG7syf zrs=)XN~dv9%9#O`4Epez?vi*}eaik0kNZ;`G&T-p`9x+4_I&0=_Dp#8DNq3kzsy8j zD}roPYV-$>lU2MyzT(jsKqot-Khb#+6nCY%f zam`rWiwloQFk4<21hgHNYps6GVM?T$!`{;3T#$Ib4}SNiBEqM<^s3v~b-}>?K2W&_ z3eDuI*Y8azRJy32q>qL)q&=O3ey{>|YXK~OE@OUV=DQgw3A4_AHs0P4(euF>g%PUY z9vfa5()W^>k@b*CtB;G{bOn2*`(op5+s9Y5mci(6ycAtY?)s0#sJ7mV3{=&&v>*oi z)#y?=)9C20y>ET-0>mu)3;SIgZUX4TYtNbK1_B9Gk8p2Dold|XBH}a2jK4tCH6vS} zXsbd;9-a6=GGod`FpZ)q&2?l&{yb7kiBr@rBvA0iTl9S|{a0J#~GOBQj&_eU(r$7j~lzEPoS)^M{7k)!7?R0)G#~ zpR$@;wbFIkf>&MtV$wcOR?}==1lTKFl7i2;9-~pXPmGp6*pw@~HO)RXxa2f4l#=Yb z%6j9qfU@LGc@>%0;05x+#p(}MVt7{G_;>Nqe`1f5ec^-{wcB0C%+87J9}nL1d=P0Y zae0#sn_wE|1Fm?Sn40*VouUaw0~|^04z$0v=PUKFX3B}bFee24yZg4C0M;u3YPfPA zkTR_$s-1m?}k@@_IlgJpnI3yd9@ z+^u98D5z;JhOBXRfeM2JX=UoPrLus&pzSFQm0pY8T+-by({5AF`sbV^@qr3&*Wzvj z=A@{UOeXiXdk{$K=N z3GP$Cc{uWbI#++`+Ww~x;+og5T?rx1rie?!8)~W~!n{9G^eP^b7a_#6-)ZkUkw;N*{MC9jH1K_RlVE;r^n>k$pwx&`V- zss%zv3G$gWe zv~eDcVzdXp`rUa9290j2RPB8!r0_8SPkcCFiv%)W+ zs=qKt+rcraD$@2eSz~dY4WnV`eLAluCf}nY6Mh`2kXQ=+VTFI2Z8I&D8tLs?knQ|+ zBERtKM6YmR`+SuzQc~X*MkS%mhu@c*@may-zjwJApXKIEzfx+2<;1Nz`C;aVscQH$ zSCO_v&nG(f?yFgnlpO=m{1^ZYm)Vj=4sn={fVdG1dh6`h1v|z89GX#*R3N-mI4xgy zwAvh3+(p6b*r<4AzZeJ_y*`a~SL@jbfT!(3Fy|MJrY<3NWOzOtLBB|}Rtc2I;oM*)G-K-JFmQIbSqPP6uT&{ak{=K> z%;X%US2DO?zX#)S>b5CSK3%Oz-O&;;jgQSAra9YrSiABU6f zr!Mk)8l7vd__-B%KR8&kd!vG1T@9TDA3k=UX)W(ndV#{N+WjHIGCt4K7=A&>E6TK5 z3KPNCGX-F{$f3SL{qCwb*}ey|*aW3^fAL-~Y&|hIm>+oT3o;(EBD(WiE|G&OC0CVgvibbw=> zEcLq>9V_Fr>UhTA!%zny`coLv1gagPiPuN-_cBKcdz;Kb1KeU@(c*B*d*+o>bYV3q z@rSPIy8GuJ7Px+D_koKf0=4@Jmfw+tv8#8Rfp+b>$Zt-C!iG_}%uEN1ACV6~i5>Q8 zk{sB$uzGcn0L2a?3qP+OFCvN}sl#Asi~z&X`1@8WNjJq+Nm^hS%2@)2q5D{17@Ed^ z3PY8^Ff{!XhM0h12%)FQ9P=p*DeEQw_()9NDK5qvvYV${=K0Qgbn>fB_0KR=oXz&H zFm(HmFjNZq2dzU^re|dx#$N&Ke;0?8!tfLQqA9AANc1mr4Juj<5L;_kKA8)5`1*&& zW@Ym^uw%e>VblT>L(*S!6OPapTuvg(2CV#osOwc7fR$f+lZb}fr-r{Ozwn0k9liTt zq&H1v!cNTXJ7=7vJQhGfbzh*Mx+UDJ9Eb68M0z)YNJy?r)@!=Mt&Te~-i!Am=zj^S zV?PP1X8;A&eRu1Wo+>|quoz(FH=&;pEuD}}H@p6i-Ymm!y;+E0E4<%hHPip+O~=2} zZ~pHscxJ#aC7EW7X!Mi7;brn044aqOK4&!ruR}K;<{!W)S{qN9JO+KuzbS|YL=>fn z08iz-YS@Q9t_T#bHPU-%&4ABz9I`{EJg%a{uj5pWRO_@$tk_kpq7Jm+(6vg~wUdo( zvuXG!3*Zcq5(ul0q#vJ9?}Edi?Z8+xM!96Pcka-@wT~CfBecJ^fo0WjwGG3e^XZqu zzi3(-Ee9L&O46ZWk1n!TkYgedL_Ua|kx z=^W+`FU0#B`?y(VvJX!C>3IJBXTvvv{KaDhbRKjH=;s=~2nj2U4wKcoYlbF+e7p2? zt>6WIW2$(8XaQ&3CB+0C03koH3@(WAu&4x{`pF>R$HG4CsKf!U>ElVKN|DE0d#&_V z`LNkNp1U47bc{v@9N8igV_KJqQHF$wtlR_VLi%(fdOmxoevOIshB>l_eJ$q46`F6~ zqh$AX!k~t2(+pwI6u|2V9eI~=6}qkP6V>|_NOE<-jYPJpKg^CUpF&fZw{8D^Uot-H zMD4eJpMW_~Au!O4+YZkb$QEgV-s=zaUP`)1Mza1VI-<+6+X@XB$5GIZ}svI zW_ng@EdnG+GIURwYKua45yj1;rA_nd8A(oVgdNlWlr!FMI>Ost ztxkyd0K4yMbxPDZ-oV@{DG}bb{gH|I)@CVNGHy|doSN3Adgw(?eBhT|Z2sm@E($GO zXS?)nimapkNFJb~AGh<@da^F-Y4eQ81wLz%n^rHZ_zlr$`r(B9zZCuO9rxR4{?VpDts505W>%Ip*Qg_wG+T68{ga*MJ;)&_e$g> zNg}JT#!FNHC1Dmela~w)`!G+lx-GAud2jCKr_#I&OR5;)xCP14a-WSR!dZD}dsFDhYThvvf!thX>HN z@s`qAxrMAjkT7XXXRUL&(yOF1Dxe$b(oBWiu@40DgKVl5Z%%Mhlqo8ODK{6P>$u>^ zhTt|-k5}+;$X#6d*=__*2O3p;g<;zkP{wFzY&Riw@oJOosp9=&dx6J!Vv_0S*%s`k z#yP7kfr~}j*_H^OsS+n5-G-yfqc5z&RWTX6GNNERXAXymWrI<%s?`kcFO4~doP?V% zl(QtVS4YG|%Fye-m79Ru=Q}8xrlio?scU+#ZET!8Ol(jn+n>9*jyY;3ZAz)qH*-60 zj{WF)2X+%*p8flc$?~i+>bG?DuOn{qCvibR0nAUa?~(4)|2pC({O1w3BrMNAj=05d z7otN6muEjC0_6c{*7q@3VR#}UI!+*_l4|nGK8r#Vp)Gu~@5sw)h06ljcx$)S^Ljt^ z?~?#@|C$6a!G8860JhAuIZ5RHPyh8Wf3;gG)f;55nXvElDUW-$F+w#_K8DdNFOtC7 z|B?Wf*MPd109?}w`*$-jKQG)f{!*Xm~ zFt30QP0yFax$}&g%LcEjLV{q!ms?GZU81|{HgD?1J{emz*Kuwqrck+pG5!3yi@j~~ ztQD(DAIYU_Rb&x{31{H@BG)P0G@y~1)4;X-LN?`UadzW1h3x~wpRWH|RS6T*za3AB zNB9xJ`&}jzW8?~HArFm@=7wH8%$EvSKF)d~zq9bWSjy_Rsa5nZ1SC=M%`ppFWdt>- zW#N0^hly&udbE*%97-q9FyU0pDg>#`M3pgdur6mGy=@wkrGua9gp-GQRo~l4b}7}I z%+3~%GHc@Y4%@hpN_LOErn&?ITm3B<1-vjql~eE1^0#lia-PzvI9x{3>Us{0uRFJk zEY?C0Un#F9)9uUEacnwk1iMvd*N!JSyqWXSI)=D03A-~IxiZ^vJ$4<5W8dyxHK2y_ zchXg<#th})gfbu)h$1gzO8d6syUGpVUP@HQK-~B6jD?E!+GV zm7{}<(5o3jOob$Yh!x>w_Tf7*cp_rRqoGG9>j?I1sVnVZO4ziPt2-BM3kHO%nRLpJ zX_-}lG0TwE3vYo!(xO=*f0&tIc-De2{<Xr;44|x%VkF1;E72p7rx`U{zQx$Z$TNgRs zCabZzkVAkxN*v;v1}qkw@H7D)q@a51P@IQih9O) z;QSQz)Hdfg2`Q>(ox@4?8++Fm-Xo+aikuK?usy(6JR9sa;w(&c9UtA@enOa(TX5h> zw?Oh!%)a37V)nKF5VNl&vkCd#`xu^8EHeL__r-`utp7t#R);^6QjS|1+fU2ou=#+x z_nlr#ur|$u>e$pL<{c{IsmKs=j*Yh;N5zM>=^oiW1!}xyc3vn>BKDtX{OI@n)^Q~X zw!>58kqPFyS?_!bAego&W<&KnF~0KQsf@r?U0{iT22iIu6@(W z%4ycQe8JA6CByF=hwd&Atx4vZSk;~x5^CmNu%zgg2P8T9HqZWlbVH&I~m^1vjO8}@$8 z3z8#=&(2HWP@SB#w@5AGu&5rbrIR&;>BA!6IL^A^!W{iLW7mj#%p;zbj}l-T#zk@{8*pu@5p<3_Y%wnxxT zI_hlFRz?gd9DO16%P4JweM3R&`=FE1C#w#N$X}sr9QC$*@T=Im_YAleMM{$rqKP{k zbOsbjn<08mGe9R!i8&iB3&A)&Eej*&7zFo{PQtiE-jBR{wPI!@gbhrADJM}hD9or< z7SY|;jBY=g0UW$;3<1hFzkbNxgVEK2&`hAT@ zYiusmN9FI`^#pBhUHIM{M4A5n)OE_5aX)ra(S<2sZ(*jDS$)H`ZkE#;xIVwKleq{8 zh_vEiHb0(waOu)_-?u&fLdbp`2pR|a<{QXMzbRH;6+q#dG>p>D6~9gj+-5 z=p{3RTrh}YZo)3MI062St3ZAJ%tXsONPW4S7s!$xy=we4a=BOLVOW+Rqn(N2*PYTb z49y_#F!uytBP&85NeE|EM2Y!SOZ{&VhG*WMIuMeJ@c;3j2N^ z3siqLo>ovcf`s+`21p8vaMAnJ*w9)qD6};+P^u92iq~p@@2Kxbx|GO}gjgy0{rJ^f z#}CNw`_Dek*7u)Xw%=~pB@dmNKCtX8BWw|TpEVghAV-7T$EBuGkVMUN%170PY*LV>Zz=z3Q5 z!Uc^i2^|7wrNiA({mw3xPULLIGj$MDvbXE%{8pDYjdv+GLN2$@yO1z2W@~woycs@= zT_{e2&!bP@Q!mTml;PHq70+-TeI|hT@oQOW3bz_OL#2`R0~aBEq^h3VdQ62%9mxNI>`uK-0^*PQpPvk zVB246c-Y5pfPQ=6(x+WJO}k?saj{sXD zQ>VtOg*2vr@0((-DI;5F-Bz|bH^TY8 zfl&}#(wcv`9Ix0|l>V-FECd=JcP>kD6m@=%xgpGIA$gl~NoS0`s#8#tOv7^NM+)S{ z!FNen>m!YDXVwV|q3XKQ8T& z8P9qo4_SwNS|A4p^eS@pS@$?6zaYAji|2p6kBK-HV&fxk2$qkkqatQ=OKR3EVVnjz zY!Sa%48P5UTfi?GfLLJt81ZVyp0GeB+!l|Ks762N2DgV=fi+vep<=p8G=fVPEBSE5 zxeyB0jjHo7a`&Ftu(Gd9F>{KoL%v)))4;1kUJ&6V_A&%r@CrqGlqEahq33&h4E>Hr zbVRkFTJ}9~#*bC5dI2siJRP%yD4rGW2UdjQmrRdt&*3qB;in&)FcusxedCE}@RAy* zenIxLpV;j|ZZ@va3@_2bOUNE5_~tU{@gGwliKB)1HMg|T_wQUU%zPZz7O5YG5`_+B|im& zls_L|b9IFbMcc(floUNe*H8$2cUSghgbr$Y8@L2@Cz$(1p%Q5H?=DkuS%tLq0 zRr3K;u>7*__749A^@y4vq$*A>hZsuh>H;!h`wdColN2G@Y!P&-XzfE*% zocGOUTL1h;wYTSuHD`$L1CE*h6&2(5dGwyg1E8;;w*o}{VhE{Sw65```kYgn6vIrJ ztNLpv$&m2sEVAjZDt4BB6!<2MM9OZ1>Wmvx3)Lu^TnssWAXN&YeBm8$N9GSXg2$nB z?W4`6j{?=Oh_uQxr((IWYAGzBz)L1lt7nBuqs;I-OA+ulF86pSY4PS|lQG20iiWz} zH(PcuEbdS{mGbuP=U0-@Fs4F_c&A9l93iVX3)AVLbR7MHSoB`Z)G^!%T1)#~6fpP!+Sq(@@ZTP zoJP$qixP#g`BP$Uq1-%JiOOh)Er_ZG77ril;Ms|aka?&}Yt{vDQ$uwJb=89TA}xje z7S0m#3hIkNd4uyR_k>9nEd)37b@IIci^J-W3&ZrHSt*O0DgwF|Jx6WZM+Lu5yn!~o zrh?_<-A`;Vh4sAl6pXd446u6<_u_mW-5>UKNZ5Kw4=Qizigz{m_> z2QUCQSXcmzuL0~7000FQ{m*w<+ffRd*jZbeI$BcEOIjQJ=a0zPSsOU&8`@FY7#Qi> zI1)Mm=$Pmj2@MRLsDQ-@@RF?c%wSnr{&T-kR7joMh{2GZkwe#rQ6Ip-&cw{Xs>cRk zWjEl^Wj17G&;#n+6aMdS(WDo(GB9*e2M_{(@#%$;HQ|#Ho+5(aTv|I}kE3 zKhcSPVU9`N{iE z%jzvC+YOT~$me_27?m%gQO2aJ5;P4hXT{>8ie&d%F^X``YC!dKs|rj-IU34i zz257^E=wMW#4{*^kBu{UJ1ctAkBmhnXc#>Zt7s5E5Z`E6XF;4{&=i(1$|#WCBT`mr zK~m7$RaOpP(zS8pRQu8KLqOAB)6}HtM*X3&rj_HeqxatF{7n(u20w=oVzgk2ZD(JS z-f~ZC9UaNNf$6!rJo@g7O|kAAr^VNp}!*} znOnPFXM@VEdSNn^5_hO%vLi;&RTpWGi>hK*52dQ4NT1MN1jOy3SXq|>plfdY*( zw>yY5-eqS_Y$cM~alc?tb6V@$BOLufu236&3Rj5bl;F>IC)!ap=_H8nVybO)>Kgq0 zm<5}`_LuSC^7WQOxDBm1t~r`Eg6!!|ttGU>zWLe~>pRdFa-yy;cO)pS-96OkU|%Y^ z`bN0}*0@e8O>r5#Ks@jb zm}O@l!Q2BYx?Y==zbK&#Q<*h}TJ2G}n@7aWy2Opy$I+hq6rd){Kr%?InI;<>G0<-9 zyf!G)kmx_{-GbIo&T)lYT+wAubY)8Ig_7=C0Y_oJVvMgf&i%GB#Piejh(d#-j5K#4 z!_EEO{HK_!#CFN!dP43j=lVtIX6_dKqgA%8<9ovx1!0U^$0t(^yy6qQWHb(#<}PR_~G%s=5t9 zuNWCh#b@5SKd@@e_+xxX<;mGK>29pL=eIZ~`hL*HnlvLhy+C2U-BJ^beS%wW3i=Gx-R|n%M zGI`W0`6}3Oord^QySPHGXCb_I8B`i|HJ4VW)PCWhv9m=`V~x6|9tM}W^FvoMLS=cS zRx9Uu$)R_t7uUUbF(8S@w(!(o0U7sR|qF(>18!Rfn^uv(ja+$wGb8gr~`$1 z3j4gv?i{(iBrB2TG@ovtYS@P^mD9d#ulJ@xV{v*$TWr|<@WSP=2Oqalu(pQjjqKwM z9F6)R7W(RwEb~K=vez% zRN4+_JdaG+nsqjEIoKtn35xOwPOu~Hpd+k$d+0)(lsCPd>naXP(Yc)4m-Z75PFo;)2d_-j#LI$$Zqz?V;Zd3+;84|GHFW&f)cSs7igZF({0M07=Kd+t3K~e(GY} zo@s)JX|mT`UZ9G6D_HWVT@%lqRA1tuU`8NEG=8YYLeUnHXVxpHe4l!+QaM(iNFCrn zqa@dPPRu81-Du2~V#uT5$Fl>H{rXlfn=MA#w#y?qIZS@?F*G)7n96GT5wG|)*mPwG z&MwY0`{+KcB5s;8GDt4fzT-a!_rNhcMjmC$6lN2R=H9+v|I6kCA z&YkmcR;5%O=mD@E1wUAnxh7j0&pXK|+b$}*q40EHNKgCh7_#K%)KNG&`=ejtPVx4N zN!6e|7X_#2KEE&@E2kQ}cnF}RACW&ypqR#2g^5HJiugJdkvh72QdbJu)!h#K>@i#F ziV&2*jQ$W!lq;%9mtwNxMShL;Hq?dkphp^B1z&-Pn*CuSYfMRsnN!|HvRrOGF$gTQ=htua-u1kE5 zqp5L@#lXIr6WU~v^V%H`=sGM9q#EKT#f1kN(FFTjhcVAG1m}<4niC20f=7<-y*A2r z(8j2imtfcHsc8Y~;x;($8%xt_RVDOR?o}TC1a@WhDQeT*9^o~3oIFTq1kRB$)1GeN zZ}TWVW>?oR2#tkq%#XntJ2wQc-vpFT7KnQ^NUW_-l4mr)Pi;a@MjB*eyi2(Fx?QAI zVHBGFwNb?_Kv{D==Bn-tbw@{wJEtLmAJWw}IZz9**j12OPb~+j1yjEhP}K$?UWqd# z;PIY1gghSno@E2(mRHy>E;WiN^}5)B=my1=Uh^?KMp*096z>uF^m#n?Su>Dk@c4*1 hufh6T!2@gWplj#gVrOUs%LwfJumE7m$b_Xu{tv;(`1b$+ literal 0 HcmV?d00001 diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/scheduler.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/scheduler.log" new file mode 100644 index 00000000..18de1978 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/scheduler.log" @@ -0,0 +1,5872 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:40.560.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-02:07:41.564.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 0(role: MS_WORKER), rank id: 0 is registered successfully. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-02:07:41.833.710 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 1(role: MS_WORKER), rank id: 1 is registered successfully. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-02:07:41.890.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 2(role: MS_WORKER), rank id: 2 is registered successfully. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-02:07:43.165.534 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 3(role: MS_WORKER), rank id: 3 is registered successfully. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-02:07:43.165.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:666] ReassignNodeRank] Rank ids are already set by numeric node ids, and this is not CM initialization. No need to reassign them. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:43.560.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:43.560.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:43.560.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:48.560.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:48.560.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:53.561.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:53.561.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:58.561.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:07:58.561.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:03.561.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:03.561.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:08.561.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:08.561.896 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:13.562.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:13.562.134 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:18.562.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:18.562.365 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:23.562.531 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:23.562.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:28.562.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:28.562.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:33.563.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:33.563.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:38.563.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:38.563.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:43.564.366 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:43.564.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:48.564.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:48.564.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:53.565.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:53.565.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:58.566.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:08:58.566.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:03.567.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:03.567.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:08.568.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:08.568.927 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:13.569.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:13.569.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:18.570.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:18.571.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:23.571.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:23.572.023 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:28.572.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:28.572.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:33.573.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:33.573.973 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:38.574.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:38.575.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:43.576.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:43.576.267 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:48.577.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:48.577.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:53.578.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:53.578.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:58.579.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:09:58.579.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:03.580.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:03.580.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:08.580.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:08.581.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:13.581.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:13.581.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:18.582.503 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:18.582.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:23.583.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:23.583.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:28.583.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:28.583.702 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:33.584.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:33.584.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:38.585.596 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:38.585.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:43.586.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:43.586.713 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:48.587.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:48.587.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:53.588.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:53.589.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:58.589.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:10:58.590.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:03.590.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:03.591.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:08.592.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:08.592.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:13.592.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:13.592.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:18.593.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:18.593.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:23.594.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:23.594.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:28.595.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:28.595.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:33.595.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:33.596.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:38.597.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:38.597.392 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:43.598.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:43.598.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:48.599.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:48.599.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:53.600.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:53.600.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:58.600.807 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:11:58.600.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:03.601.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:03.601.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:08.602.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:08.602.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:13.603.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:13.603.222 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:18.604.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:18.604.363 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:23.604.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:23.604.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:28.605.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:28.605.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:33.606.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:33.606.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:38.607.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:38.607.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:43.608.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:43.608.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:48.609.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:48.609.162 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:53.610.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:53.610.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:58.610.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:12:58.610.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:03.611.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:03.611.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:08.612.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:08.612.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:13.613.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:13.613.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:18.614.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:18.614.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:23.615.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:23.615.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:28.616.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:28.616.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:33.617.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:33.618.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:38.618.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:38.618.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:43.619.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:43.619.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:48.620.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:48.620.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:53.621.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:53.621.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:58.622.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:13:58.622.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:03.623.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:03.623.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:08.623.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:08.623.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:13.624.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:13.624.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:18.625.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:18.625.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:23.626.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:23.626.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:28.627.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:28.627.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:33.627.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:33.627.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:38.628.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:38.628.702 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:43.629.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:43.629.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:48.630.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:48.630.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:53.631.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:53.631.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:58.632.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:14:58.632.875 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:03.633.036 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:03.633.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:08.634.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:08.634.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:13.635.076 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:13.635.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:18.635.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:18.636.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:23.636.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:23.636.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:28.637.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:28.637.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:33.638.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:33.638.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:38.639.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:38.639.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:43.639.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:43.639.872 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:48.640.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:48.640.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:53.641.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:53.641.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:58.642.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:15:58.642.102 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:03.642.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:03.642.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:08.643.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:08.643.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:13.643.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:13.643.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:18.643.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:18.643.812 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:23.644.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:23.644.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:28.644.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:28.644.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:33.645.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:33.645.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:38.646.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:38.646.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:43.647.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:43.647.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:48.648.076 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:48.648.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:53.648.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:53.648.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:58.648.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:16:58.648.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:03.649.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:03.649.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:08.649.655 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:08.649.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:13.651.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:13.651.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:18.651.921 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:18.651.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:23.652.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:23.652.966 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:28.653.116 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:28.653.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:33.653.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:33.653.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:38.654.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:38.654.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:43.655.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:43.655.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:48.656.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:48.656.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:53.657.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:53.657.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:58.658.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:17:58.658.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:03.658.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:03.658.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:08.660.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:08.660.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:13.661.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:13.661.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:18.662.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:18.662.540 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:23.663.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:23.663.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:28.664.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:28.664.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:33.664.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:33.664.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:38.665.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:38.665.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:43.666.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:43.666.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:48.667.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:48.667.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:53.668.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:53.668.610 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:58.669.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:18:58.669.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:03.670.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:03.670.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:08.671.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:08.671.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:13.672.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:13.672.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:18.672.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:18.672.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:23.673.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:23.673.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:28.673.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:28.674.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:33.674.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:33.674.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:38.675.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:38.675.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:43.676.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:43.676.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:48.677.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:48.677.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:53.678.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:53.678.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:58.678.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:19:58.678.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:03.679.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:03.679.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:08.680.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:08.680.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:13.681.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:13.681.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:18.682.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:18.682.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:23.682.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:23.682.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:28.683.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:28.683.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:33.683.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:33.684.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:38.684.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:38.684.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:43.685.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:43.685.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:48.686.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:48.686.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:53.687.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:53.687.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:58.687.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:20:58.687.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:03.688.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:03.688.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:08.689.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:08.689.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:13.690.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:13.690.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:18.691.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:18.691.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:23.692.573 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:23.692.655 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:28.693.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:28.693.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:33.693.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:33.693.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:38.693.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:38.694.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:43.694.861 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:43.694.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:48.695.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:48.695.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:53.696.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:53.696.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:58.697.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:21:58.698.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:03.698.897 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:03.698.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:08.699.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:08.699.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:13.700.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:13.700.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:18.701.214 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:18.701.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:23.702.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:23.702.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:28.703.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:28.703.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:33.704.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:33.704.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:38.705.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:38.705.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:43.705.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:43.705.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:48.706.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:48.706.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:53.707.479 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:53.707.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:58.710.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:22:58.710.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:03.711.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:03.711.320 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:08.712.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:08.712.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:13.713.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:13.713.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:18.713.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:18.713.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:23.714.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:23.714.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:28.714.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:28.714.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:33.715.082 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:33.715.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:38.716.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:38.716.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:43.717.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:43.717.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:48.718.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:48.718.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:53.718.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:53.718.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:58.719.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:23:58.719.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:03.720.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:03.720.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:08.721.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:08.721.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:13.722.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:13.722.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:18.723.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:18.723.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:23.724.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:23.724.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:28.725.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:28.725.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:33.726.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:33.726.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:38.727.738 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:38.727.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:43.728.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:43.728.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:48.729.010 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:48.729.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:53.729.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:53.730.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:58.730.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:24:58.731.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:03.732.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:03.732.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:08.732.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:08.732.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:13.733.348 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:13.733.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:18.734.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:18.734.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:23.735.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:23.735.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:28.736.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:28.736.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:33.736.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:33.736.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:38.737.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:38.737.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:43.738.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:43.738.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:48.739.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:48.739.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:53.739.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:53.739.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:58.740.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:25:58.740.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:03.741.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:03.741.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:08.742.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:08.742.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:13.742.669 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:13.742.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:18.743.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:18.743.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:23.744.869 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:23.744.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:28.746.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:28.746.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:33.747.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:33.747.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:38.748.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:38.748.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:43.749.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:43.749.652 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:48.749.816 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:48.749.928 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:53.750.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:53.750.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:58.750.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:26:58.750.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:03.751.413 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:03.751.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:08.752.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:08.752.691 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:13.753.551 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:13.753.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:18.754.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:18.754.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:23.755.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:23.755.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:28.756.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:28.756.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:33.757.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:33.757.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:38.757.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:38.758.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:43.759.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:43.759.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:48.760.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:48.760.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:53.761.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:53.761.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:58.762.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:27:58.762.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:03.762.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:03.762.533 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:08.763.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:08.763.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:13.764.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:13.765.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:18.766.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:18.766.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:23.766.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:23.766.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:28.767.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:28.767.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:33.768.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:33.768.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:38.769.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:38.769.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:43.770.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:43.771.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:48.771.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:48.772.070 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:53.773.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:53.773.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:58.774.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:28:58.774.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:03.774.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:03.774.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:08.775.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:08.775.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:13.776.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:13.776.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:18.778.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:18.778.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:23.779.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:23.779.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:28.780.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:28.780.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:33.781.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:33.781.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:38.782.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:38.782.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:43.783.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:43.783.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:48.783.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:48.784.032 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:53.785.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:53.785.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:58.786.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:29:58.786.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:03.787.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:03.787.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:08.788.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:08.788.514 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:13.789.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:13.789.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:18.790.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:18.790.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:23.790.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:23.790.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:28.790.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:28.790.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:33.791.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:33.792.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:38.793.079 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:38.793.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:43.794.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:43.794.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:48.795.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:48.795.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:53.796.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:53.796.691 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:58.796.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:30:58.796.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:03.797.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:03.797.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:08.798.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:08.798.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:13.799.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:13.799.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:18.800.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:18.800.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:23.801.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:23.801.298 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:28.802.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:28.802.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:33.803.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:33.803.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:38.804.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:38.804.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:43.804.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:43.804.930 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:48.806.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:48.806.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:53.806.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:53.806.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:58.807.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:31:58.807.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:03.807.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:03.807.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:08.807.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:08.807.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:13.808.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:13.808.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:18.809.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:18.809.930 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:23.810.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:23.810.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:28.811.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:28.811.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:33.812.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:33.812.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:38.813.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:38.813.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:43.813.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:43.813.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:48.813.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:48.814.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:53.814.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:53.814.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:58.815.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:32:58.815.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:03.816.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:03.816.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:08.817.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:08.817.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:13.818.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:13.818.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:18.819.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:18.819.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:23.820.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:23.820.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:28.821.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:28.821.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:33.822.530 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:33.822.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:38.823.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:38.823.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:43.825.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:43.825.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:48.826.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:48.826.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:53.826.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:53.826.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:58.826.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:33:58.826.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:03.827.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:03.827.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:08.828.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:08.828.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:13.829.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:13.829.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:18.831.075 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:18.831.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:23.832.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:23.832.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:28.832.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:28.832.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:33.832.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:33.832.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:38.833.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:38.833.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:43.834.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:43.834.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:48.835.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:48.835.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:53.837.185 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:53.837.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:58.838.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:34:58.838.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:03.839.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:03.839.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:08.840.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:08.840.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:13.841.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:13.841.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:18.842.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:18.842.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:23.842.738 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:23.842.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:28.844.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:28.844.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:33.845.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:33.845.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:38.845.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:38.845.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:43.846.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:43.846.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:48.847.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:48.847.542 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:53.848.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:53.848.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:58.848.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:35:58.848.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:03.850.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:03.850.267 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:08.851.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:08.851.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:13.851.513 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:13.851.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:18.852.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:18.852.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:23.853.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:23.853.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:28.854.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:28.854.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:33.855.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:33.856.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:38.856.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:38.857.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:43.857.960 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:43.858.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:48.859.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:48.859.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:53.859.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:53.859.363 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:58.860.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:36:58.860.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:03.862.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:03.862.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:08.863.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:08.863.110 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:13.864.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:13.864.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:18.865.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:18.865.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:23.865.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:23.865.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:28.865.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:28.865.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:33.866.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:33.866.662 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:38.867.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:38.868.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:43.869.160 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:43.869.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:48.870.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:48.870.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:53.871.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:53.871.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:58.872.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:37:58.872.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:03.873.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:03.873.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:08.874.809 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:08.874.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:13.875.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:13.875.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:18.877.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:18.877.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:23.878.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:23.878.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:28.879.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:28.879.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:33.879.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:33.879.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:38.880.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:38.880.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:43.881.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:43.881.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:48.883.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:48.883.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:53.883.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:53.883.536 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:58.883.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:38:58.883.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:03.883.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:03.884.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:08.884.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:08.884.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:13.884.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:13.884.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:18.885.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:18.885.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:23.886.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:23.887.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:28.888.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:28.888.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:33.888.383 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:33.888.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:38.888.630 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:38.888.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:43.888.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:43.888.968 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:48.889.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:48.890.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:53.891.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:53.891.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:58.892.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:39:58.892.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:03.892.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:03.892.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:08.893.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:08.893.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:13.893.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:13.893.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:18.893.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:18.893.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:23.893.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:23.893.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:28.893.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:28.894.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:33.894.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:33.894.298 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:38.894.455 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:38.894.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:43.894.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:43.894.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:48.895.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:48.895.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:53.895.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:53.895.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:58.895.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:40:58.895.721 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:03.895.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:03.895.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:08.896.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:08.896.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:13.896.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:13.896.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:18.896.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:18.896.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:23.896.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:23.896.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:28.897.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:28.897.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:33.897.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:33.897.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:38.897.516 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:38.897.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:43.897.743 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:43.897.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:48.898.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:48.898.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:53.899.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:53.899.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:58.899.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:41:58.899.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:03.900.562 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:03.900.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:08.902.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:08.902.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:13.903.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:13.903.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:18.904.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:18.904.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:23.904.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:23.904.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:28.905.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:28.905.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:33.906.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:33.906.471 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:38.906.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:38.906.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:43.907.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:43.907.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:48.908.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:48.908.224 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:53.909.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:53.909.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:58.910.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:42:58.911.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:03.911.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:03.911.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:08.912.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:08.912.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:13.914.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:13.914.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:18.915.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:18.915.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:23.916.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:23.916.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:28.917.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:28.917.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:33.918.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:33.918.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:38.918.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:38.919.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:43.919.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:43.920.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:48.920.185 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:48.920.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:53.921.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:53.921.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:58.921.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:43:58.921.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:03.922.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:03.922.369 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:08.923.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:08.923.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:13.924.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:13.924.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:18.925.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:18.925.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:23.925.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:23.925.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:28.925.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:28.925.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:33.926.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:33.926.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:38.926.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:38.927.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:43.927.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:43.927.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:48.929.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:48.929.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:53.930.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:53.930.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:58.930.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:44:58.930.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:03.931.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:03.931.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:08.932.446 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:08.932.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:13.933.295 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:13.933.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:18.934.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:18.934.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:23.935.241 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:23.935.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:28.936.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:28.936.291 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:33.936.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:33.936.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:38.937.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:38.937.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:43.938.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:43.938.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:48.939.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:48.939.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:53.939.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:53.939.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:58.940.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:45:58.940.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:03.941.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:03.941.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:08.941.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:08.942.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:13.943.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:13.943.366 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:18.944.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:18.944.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:23.945.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:23.945.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:28.946.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:28.946.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:33.946.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:33.947.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:38.947.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:38.948.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:43.948.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:43.948.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:48.949.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:48.949.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:53.950.133 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:53.950.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:58.951.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:46:58.951.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:03.952.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:03.952.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:08.953.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:08.953.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:13.954.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:13.954.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:18.954.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:18.954.366 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:23.955.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:23.955.238 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:28.956.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:28.956.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:33.957.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:33.957.302 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:38.958.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:38.958.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:43.958.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:43.958.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:48.959.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:48.959.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:53.959.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:53.959.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:58.960.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:47:58.960.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:03.961.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:03.961.733 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:08.962.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:08.962.713 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:13.963.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:13.963.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:18.963.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:18.963.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:23.964.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:23.964.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:28.964.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:28.964.351 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:33.964.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:33.964.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:38.964.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:38.964.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:43.965.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:43.965.078 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:48.965.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:48.965.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:53.965.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:53.965.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:58.965.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:48:58.965.770 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:03.965.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:03.965.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:08.966.157 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:08.966.224 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:13.966.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:13.966.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:18.966.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:18.966.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:23.966.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:23.966.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:28.967.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:28.967.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:33.967.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:33.967.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:38.967.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:38.967.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:43.967.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:43.967.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:48.967.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:48.968.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:53.968.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:53.968.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:58.968.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:49:58.968.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:03.968.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:03.969.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:08.969.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:08.969.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:13.969.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:13.969.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:18.969.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:18.969.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:23.969.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:23.969.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:28.970.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:28.970.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:33.970.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:33.970.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:38.970.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:38.970.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:43.970.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:43.970.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:48.971.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:48.971.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:53.971.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:53.971.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:58.971.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:50:58.971.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:03.971.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:03.971.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:08.972.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:08.972.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:13.972.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:13.972.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:18.972.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:18.972.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:23.972.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:23.972.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:28.972.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:28.973.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:33.973.202 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:33.973.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:38.973.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:38.973.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:43.973.656 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:43.973.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:48.973.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:48.973.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:53.974.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:53.974.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:58.974.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:51:58.974.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:03.974.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:03.974.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:08.974.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:08.974.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:13.975.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:13.975.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:18.975.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:18.975.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:23.975.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:23.975.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:28.975.693 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:28.975.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:33.975.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:33.975.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:38.976.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:38.976.222 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:43.976.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:43.976.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:48.976.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:48.976.727 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:53.976.884 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:53.976.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:58.977.111 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:52:58.977.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:03.977.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:03.977.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:08.977.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:08.977.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:13.977.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:13.977.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:18.978.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:18.978.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:23.978.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:23.978.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:28.978.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:28.978.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:33.978.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:33.978.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:38.978.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:38.979.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:43.979.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:43.979.300 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:48.979.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:48.979.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:53.979.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:53.979.757 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:58.979.905 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:53:58.979.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:03.980.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:03.980.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:08.980.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:08.980.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:13.980.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:13.980.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:18.980.871 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:18.980.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:23.981.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:23.981.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:28.981.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:28.981.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:33.981.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:33.981.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:38.981.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:38.981.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:43.982.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:43.982.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:48.982.257 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:48.982.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:53.982.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:53.982.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:58.982.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:54:58.982.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:03.982.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:03.983.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:08.983.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:08.983.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:13.983.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:13.983.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:18.983.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:18.983.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:23.983.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:23.983.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:28.984.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:28.984.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:33.984.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:33.984.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:38.984.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:38.984.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:43.984.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:43.984.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:48.985.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:48.985.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:53.985.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:53.985.327 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:58.985.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:55:58.985.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:03.985.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:03.985.781 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:08.985.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:08.986.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:13.986.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:13.986.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:18.986.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:18.986.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:23.986.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:23.986.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:28.986.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:28.986.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:33.987.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:33.987.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:38.987.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:38.987.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:43.987.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:43.987.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:48.987.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:48.987.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:53.988.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:53.988.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:58.988.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:56:58.988.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:03.988.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:03.988.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:08.988.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:08.988.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:13.989.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:13.989.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:18.989.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:18.989.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:23.989.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:23.989.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:28.989.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:28.989.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:33.989.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:33.990.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:38.990.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:38.990.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:43.990.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:43.990.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:48.990.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:48.990.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:53.990.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:53.991.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:58.991.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:57:58.991.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:03.991.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:03.991.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:08.991.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:08.991.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:13.991.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:13.991.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:18.992.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:18.992.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:23.992.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:23.992.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:28.992.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:28.992.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:33.992.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:33.992.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:38.993.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:38.993.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:43.993.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:43.993.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:48.993.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:48.993.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:53.993.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:53.993.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:58.993.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:58:58.994.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:03.994.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:03.994.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:08.994.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:08.994.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:13.994.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:13.994.749 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:18.994.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:18.994.973 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:23.995.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:23.995.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:28.995.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:28.995.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:33.995.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:33.995.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:38.995.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:38.995.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:43.996.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:43.996.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:48.996.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:48.996.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:53.996.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:53.996.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:58.996.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-02:59:58.996.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:03.997.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:03.997.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:08.997.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:08.997.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:13.997.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:13.997.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:18.997.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:18.997.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:23.998.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:23.998.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:28.998.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:28.998.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:33.998.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:33.998.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:38.998.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:38.998.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:43.999.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:43.999.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:48.999.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:48.999.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:53.999.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:53.999.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:58.999.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:00:58.999.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:03.999.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:03.999.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:09.000.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:09.000.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:14.000.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:14.000.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:19.000.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:19.000.705 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:24.000.868 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:24.000.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:29.001.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:29.001.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:34.001.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:34.001.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:39.001.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:39.001.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:44.001.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:44.001.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:49.002.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:49.002.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:54.002.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:54.002.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:59.002.472 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:01:59.002.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:04.002.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:04.002.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:09.002.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:09.003.005 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:14.003.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:14.003.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:19.003.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:19.003.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:24.003.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:24.003.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:29.003.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:29.003.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:34.004.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:34.004.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:39.004.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:39.004.421 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:44.004.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:44.004.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:49.004.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:49.004.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:54.005.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:54.005.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:59.005.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:02:59.005.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:04.005.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:04.005.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:09.005.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:09.005.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:14.006.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:14.006.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:19.006.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:19.006.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:24.006.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:24.006.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:29.006.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:29.006.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:34.006.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:34.007.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:39.007.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:39.007.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:44.007.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:44.007.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:49.007.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:49.007.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:54.007.899 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:54.007.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:59.008.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:03:59.008.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:04.008.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:04.008.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:09.008.602 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:09.008.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:14.008.832 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:14.008.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:19.009.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:19.009.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:24.009.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:24.009.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:29.009.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:29.009.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:34.009.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:34.009.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:39.009.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:39.010.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:44.010.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:44.010.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:49.010.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:49.010.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:54.010.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:54.010.723 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:59.010.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:04:59.010.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:04.011.115 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:04.011.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:09.011.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:09.011.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:14.011.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:14.011.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:19.011.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:19.011.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:24.012.059 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:24.012.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:29.012.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:29.012.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:34.012.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:34.012.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:39.012.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:39.012.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:44.013.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:44.013.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:49.013.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:49.013.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:54.013.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:54.013.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:59.013.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:05:59.013.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:04.013.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:04.014.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:09.014.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:09.014.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:14.014.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:14.014.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:19.014.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:19.014.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:24.014.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:24.014.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:29.015.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:29.015.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:34.015.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:34.015.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:39.015.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:39.015.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:44.015.794 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:44.015.872 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:49.016.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:49.016.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:54.016.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:54.016.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:59.016.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:06:59.016.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:04.016.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:04.016.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:09.016.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:09.017.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:14.017.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:14.017.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:19.017.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:19.017.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:24.017.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:24.017.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:29.017.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:29.017.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:34.018.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:34.018.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:39.018.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:39.018.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:44.018.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:44.018.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:49.018.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:49.018.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:54.019.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:54.019.176 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:59.019.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:07:59.019.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:04.019.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:04.019.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:09.019.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:09.019.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:14.020.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:14.020.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:19.020.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:19.020.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:24.020.566 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:24.020.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:29.020.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:29.020.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:34.021.005 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:34.021.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:39.021.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:39.021.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:44.021.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:44.021.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:49.021.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:49.021.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:54.021.958 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:54.022.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:59.022.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:08:59.022.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:04.022.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:04.022.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:09.022.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:09.022.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:14.022.932 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:14.023.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:19.023.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:19.023.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:24.023.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:24.023.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:29.023.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:29.023.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:34.023.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:34.023.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:39.024.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:39.024.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:44.024.348 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:44.024.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:49.024.599 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:49.024.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:54.024.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:54.024.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:59.025.076 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:09:59.025.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:04.025.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:04.025.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:09.025.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:09.025.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:14.025.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:14.025.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:19.025.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:19.026.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:24.026.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:24.026.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:29.026.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:29.026.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:34.026.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:34.026.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:39.026.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:39.026.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:44.027.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:44.027.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:49.027.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:49.027.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:54.027.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:54.027.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:59.027.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:10:59.027.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:04.028.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:04.028.141 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:09.028.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:09.028.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:14.028.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:14.028.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:19.028.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:19.028.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:24.029.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:24.029.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:29.029.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:29.029.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:34.029.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:34.029.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:39.029.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:39.029.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:44.029.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:44.030.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:49.030.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:49.030.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:54.030.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:54.030.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:59.030.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:11:59.030.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:04.030.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:04.031.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:09.031.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:09.031.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:14.031.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:14.031.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:19.031.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:19.031.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:24.031.869 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:24.031.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:29.032.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:29.032.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:34.032.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:34.032.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:39.032.599 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:39.032.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:44.032.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:44.032.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:49.033.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:49.033.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:54.033.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:54.033.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:59.033.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:12:59.033.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:04.033.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:04.033.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:09.034.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:09.034.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:14.034.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:14.034.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:19.034.513 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:19.034.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:24.034.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:24.034.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:29.035.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:29.035.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:34.035.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:34.035.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:39.035.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:39.035.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:44.035.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:44.035.781 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:49.035.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:49.036.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:54.036.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:54.036.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:59.036.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:13:59.036.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:04.036.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:04.036.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:09.036.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:09.036.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:14.037.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:14.037.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:19.037.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:19.037.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:24.037.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:24.037.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:29.037.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:29.037.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:34.038.005 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:34.038.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:39.038.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:39.038.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:44.038.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:44.038.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:49.038.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:49.038.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:54.038.910 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:54.038.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:59.039.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:14:59.039.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:04.039.347 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:04.039.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:09.039.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:09.039.646 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:14.039.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:14.039.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:19.040.036 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:19.040.103 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:24.040.263 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:24.040.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:29.040.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:29.040.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:34.040.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:34.040.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:39.040.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:39.041.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:44.041.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:44.041.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:49.041.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:49.041.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:54.041.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:54.041.747 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:59.041.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:15:59.041.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:04.042.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:04.042.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:09.042.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:09.042.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:14.042.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:14.042.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:19.042.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:19.042.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:24.043.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:24.043.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:29.043.294 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:29.043.365 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:34.043.523 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:34.043.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:39.043.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:39.043.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:44.043.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:44.044.054 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:49.044.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:49.044.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:54.044.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:54.044.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:59.044.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:16:59.044.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:04.044.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:04.044.920 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:09.045.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:09.045.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:14.045.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:14.045.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:19.045.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:19.045.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:24.045.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:24.045.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:29.046.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:29.046.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:34.046.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:34.046.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:39.046.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:39.046.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:44.046.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:44.046.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:49.046.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:49.047.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:54.047.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:54.047.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:59.047.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:17:59.047.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:04.047.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:04.047.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:09.047.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:09.047.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:14.048.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:14.048.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:19.048.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:19.048.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:24.048.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:24.048.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:29.048.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:29.048.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:34.049.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:34.049.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:39.049.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:39.049.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:44.049.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:44.049.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:49.049.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:49.049.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:54.050.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:54.050.078 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:59.050.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:18:59.050.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:04.050.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:04.050.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:09.050.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:09.050.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:14.050.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:14.051.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:19.051.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:19.051.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:24.051.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:24.051.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:29.051.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:29.051.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:34.051.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:34.051.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:39.052.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:39.052.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:44.052.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:44.052.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:49.052.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:49.052.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:54.052.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:54.052.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:59.053.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:19:59.053.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:04.053.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:04.053.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:09.053.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:09.054.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:14.054.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:14.054.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:19.054.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:19.054.514 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:24.054.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:24.054.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:29.054.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:29.054.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:34.055.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:34.055.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:39.055.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:39.055.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:44.055.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:44.055.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:49.055.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:49.055.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:54.056.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:54.056.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:59.056.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:20:59.056.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:04.056.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:04.056.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:09.056.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:09.056.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:14.056.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:14.057.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:19.057.218 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:19.057.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:24.057.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:24.057.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:29.057.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:29.057.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:34.057.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:34.058.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:39.058.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:39.058.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:44.058.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:44.058.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:49.058.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:49.058.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:54.058.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:54.058.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:59.059.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:21:59.059.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:04.059.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:04.059.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:09.059.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:09.059.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:14.059.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:14.059.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:19.060.082 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:19.060.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:24.060.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:24.060.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:29.060.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:29.060.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:34.060.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:34.060.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:39.061.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:39.061.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:44.061.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:44.061.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:49.061.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:49.061.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:54.061.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:54.061.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:59.061.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:22:59.062.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:04.062.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:04.062.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:09.062.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:09.062.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:14.062.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:14.062.770 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:19.062.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:19.062.980 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:24.063.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:24.063.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:29.063.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:29.063.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:34.063.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:34.063.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:39.063.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:39.063.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:44.064.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:44.064.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:49.064.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:49.064.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:54.064.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:54.064.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:59.064.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:23:59.064.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:04.065.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:04.065.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:09.065.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:09.065.351 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:14.065.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:14.065.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:19.065.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:19.065.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:24.066.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:24.066.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:29.066.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:29.066.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:34.066.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:34.066.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:39.066.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:39.066.780 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:44.066.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:44.067.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:49.067.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:49.067.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:54.067.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:54.067.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:59.067.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:24:59.067.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:04.067.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:04.067.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:09.068.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:09.068.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:14.068.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:14.068.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:19.068.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:19.068.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:24.068.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:24.068.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:29.069.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:29.069.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:34.069.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:34.069.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:39.069.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:39.069.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:44.069.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:44.069.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:49.070.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:49.070.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:54.070.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:54.070.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:59.070.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:25:59.070.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:04.070.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:04.070.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:09.070.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:09.071.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:14.071.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:14.071.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:19.071.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:19.071.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:24.071.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:24.071.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:29.071.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:29.071.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:34.072.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:34.072.234 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:39.072.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:39.072.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:44.072.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:44.072.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:49.072.866 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:49.072.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:54.073.087 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:54.073.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:59.073.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:26:59.073.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:04.073.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:04.073.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:09.073.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:09.073.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:14.074.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:14.074.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:19.074.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:19.074.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:24.074.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:24.074.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:29.074.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:29.074.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:34.074.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:34.075.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:39.075.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:39.075.262 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:44.075.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:44.075.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:49.075.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:49.075.691 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:54.075.871 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:54.075.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:59.076.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:27:59.076.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:04.076.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:04.076.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:09.076.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:09.076.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:14.076.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:14.076.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:19.077.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:19.077.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:24.077.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:24.077.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:29.077.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:29.077.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:34.077.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:34.077.868 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:39.078.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:39.078.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:44.078.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:44.078.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:49.078.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:49.078.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:54.078.736 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:54.078.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:59.078.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:28:59.079.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:04.079.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:04.079.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:09.079.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:09.079.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:14.079.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:14.079.727 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:19.079.910 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:19.079.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:24.080.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:24.080.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:29.080.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:29.080.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:34.080.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:34.080.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:39.080.849 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:39.080.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:44.081.079 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:44.081.162 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:49.081.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:49.081.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:54.081.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:54.081.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:59.081.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:29:59.081.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:04.082.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:04.082.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:09.082.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:09.082.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:14.082.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:14.082.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:19.082.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:19.082.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:24.082.971 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:24.083.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:29.083.202 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:29.083.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:34.083.432 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:34.083.511 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:39.083.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:39.083.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:44.083.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:44.084.004 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:49.084.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:49.084.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:54.084.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:54.084.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:59.084.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:30:59.084.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:04.084.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:04.084.938 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:09.085.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:09.085.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:14.085.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:14.085.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:19.085.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:19.085.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:24.085.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:24.085.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:29.086.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:29.086.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:34.086.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:34.086.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:39.086.507 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:39.086.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:44.086.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:44.086.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:49.086.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:49.087.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:54.087.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:54.087.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:59.087.454 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:31:59.087.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:04.087.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:04.087.799 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:09.087.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:09.088.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:14.088.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:14.088.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:19.088.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:19.088.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:24.088.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:24.088.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:29.088.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:29.088.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:34.089.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:34.089.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:39.089.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:39.089.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:44.089.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:44.089.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:49.089.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:49.089.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:54.090.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:54.090.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:59.090.247 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:32:59.090.327 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:04.090.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:04.090.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:09.090.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:09.090.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:14.090.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:14.091.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:19.091.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:19.091.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:24.091.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:24.091.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:29.091.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:29.091.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:34.091.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:34.091.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:39.092.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:39.092.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:44.092.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:44.092.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:49.092.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:49.092.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:54.092.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:54.092.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:59.093.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:33:59.093.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:04.093.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:04.093.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:09.093.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:09.093.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:14.093.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:14.093.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:19.094.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:19.094.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:24.094.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:24.094.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:29.094.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:29.094.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:34.094.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:34.094.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:39.094.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:39.095.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:44.095.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:44.095.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:49.095.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:49.095.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:54.095.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:54.095.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:59.095.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:34:59.095.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:04.096.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:04.096.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:09.096.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:09.096.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:14.096.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:14.096.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:19.096.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:19.096.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:24.097.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:24.097.200 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:29.098.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:29.098.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:34.099.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:34.099.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:39.099.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:39.099.973 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:44.100.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:44.100.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:49.101.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:49.101.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:54.102.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:54.102.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:59.103.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:35:59.103.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:04.104.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:04.104.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:09.105.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:09.105.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:14.105.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:14.105.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:19.106.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:19.106.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:24.107.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:24.107.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:29.108.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:29.108.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:34.109.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:34.109.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:39.111.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:39.111.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:44.112.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:44.112.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:49.113.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:49.113.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:54.113.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:54.114.054 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:59.115.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:36:59.115.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:04.115.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:04.116.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:09.116.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:09.116.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:14.117.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:14.117.262 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:19.118.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:19.118.300 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:24.119.168 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:24.119.246 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:29.120.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:29.120.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:34.121.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:34.121.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:39.122.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:39.122.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:44.122.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:44.122.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:49.123.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:49.123.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:54.124.426 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:54.124.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:59.125.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:37:59.125.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:04.126.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:04.126.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:09.127.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:09.127.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:14.128.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:14.128.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:19.129.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:19.129.646 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:24.130.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:24.130.675 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:29.130.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:29.130.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:34.131.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:34.131.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:39.132.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:39.132.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:44.132.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:44.133.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:49.134.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:49.134.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:54.134.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:54.134.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:59.134.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:38:59.135.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:04.135.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:04.135.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:09.136.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:09.136.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:14.137.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:14.137.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:19.138.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:19.138.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:24.139.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:24.139.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:29.139.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:29.139.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:34.140.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:34.140.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:39.141.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:39.141.636 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:44.141.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:44.141.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:49.142.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:49.142.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:54.143.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:54.143.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:59.145.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:39:59.145.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:04.145.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:04.145.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:09.146.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:09.146.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:14.147.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:14.147.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:19.148.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:19.148.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:24.149.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:24.149.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:29.150.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:29.150.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:34.150.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:34.150.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:39.151.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:39.151.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:44.151.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:44.152.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:49.152.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:49.152.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:54.153.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:54.153.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:59.154.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:40:59.154.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:04.155.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:04.155.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:09.156.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:09.156.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:14.157.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:14.157.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:19.158.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:19.158.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:24.159.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:24.159.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:29.159.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:29.159.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:34.160.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:34.161.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:39.161.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:39.161.982 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:44.162.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:44.163.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:49.163.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:49.164.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:54.165.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:54.165.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:59.165.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:41:59.165.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:04.165.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:04.165.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:09.166.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:09.166.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:14.167.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:14.167.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:19.168.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:19.168.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:24.169.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:24.169.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:29.170.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:29.171.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:34.171.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:34.171.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:39.172.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:39.172.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:44.173.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:44.173.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:49.174.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:49.174.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:54.175.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:54.175.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:59.175.568 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:42:59.175.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:04.176.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:04.176.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:09.177.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:09.177.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:14.178.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:14.178.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:19.179.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:19.179.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:24.180.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:24.180.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:29.181.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:29.181.625 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:34.182.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:34.182.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:39.183.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:39.183.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:44.184.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:44.184.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:49.184.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:49.184.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:54.186.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:54.186.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:59.187.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:43:59.187.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:04.187.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:04.187.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:09.188.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:09.188.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:14.189.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:14.189.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:19.190.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:19.190.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:24.190.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:24.191.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:29.192.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:29.192.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:34.193.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:34.193.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:39.194.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:39.194.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:44.195.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:44.195.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:49.196.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:49.196.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:54.197.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:54.197.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:59.198.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:44:59.198.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:04.199.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:04.199.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:09.200.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:09.200.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:14.201.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:14.201.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:19.202.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:19.202.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:24.203.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:24.203.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:29.203.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:29.203.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:34.204.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:34.204.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:39.205.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:39.205.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:44.206.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:44.206.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:49.207.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:49.207.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:54.207.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:54.207.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:59.208.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:45:59.208.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:04.209.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:04.209.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:09.209.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:09.209.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:14.211.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:14.211.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:19.212.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:19.212.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:24.212.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:24.213.094 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:29.213.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:29.213.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:34.214.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:34.214.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:39.215.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:39.215.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:44.215.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:44.215.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:49.216.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:49.216.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:54.216.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:54.216.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:59.217.765 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:46:59.217.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:04.218.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:04.218.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:09.219.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:09.219.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:14.220.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:14.220.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:19.222.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:19.222.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:24.223.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:24.223.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:29.224.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:29.224.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:34.224.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:34.224.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:39.225.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:39.225.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:44.225.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:44.225.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:49.226.582 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:49.226.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:54.227.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:54.228.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:59.228.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:47:59.228.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:04.229.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:04.230.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:09.230.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:09.230.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:14.231.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:14.231.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:19.232.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:19.232.875 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:24.233.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:24.233.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:29.235.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:29.235.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:34.236.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:34.236.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:39.237.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:39.237.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:44.238.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:44.238.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:49.239.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:49.239.103 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:54.239.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:54.239.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:59.239.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:48:59.239.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:04.240.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:04.240.502 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:09.241.419 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:09.241.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:14.242.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:14.242.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:19.243.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:19.243.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:24.244.293 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:24.244.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:29.244.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:29.244.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:34.246.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:34.246.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:39.247.023 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:39.247.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:44.247.255 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:44.247.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:49.248.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:49.248.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:54.249.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:54.249.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:59.250.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:49:59.250.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:04.250.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:04.250.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:09.251.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:09.251.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:14.252.495 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:14.252.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:19.253.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:19.253.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:24.253.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:24.253.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:29.254.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:29.254.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:34.255.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:34.255.721 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:39.256.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:39.256.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:44.257.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:44.257.659 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:49.258.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:49.259.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:54.259.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:54.260.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:59.260.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:50:59.261.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:04.261.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:04.262.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:09.262.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:09.263.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:14.264.014 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:14.264.101 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:19.265.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:19.265.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:24.266.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:24.266.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:29.267.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:29.267.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:34.268.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:34.268.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:39.269.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:39.269.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:44.270.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:44.270.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:49.271.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:49.271.440 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:54.272.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:54.272.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:59.273.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:51:59.273.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:04.274.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:04.274.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:09.275.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:09.275.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:14.276.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:14.276.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:19.277.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:19.277.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:24.278.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:24.278.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:29.278.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:29.279.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:34.280.023 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:34.280.103 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:39.280.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:39.281.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:44.281.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:44.281.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:49.282.869 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:49.282.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:54.283.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:54.283.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:59.284.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:52:59.284.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:04.284.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:04.284.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:09.284.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:09.285.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:14.285.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:14.285.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:19.286.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:19.286.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:24.287.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:24.287.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:29.288.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:29.288.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:34.290.033 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:34.290.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:39.290.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:39.290.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:44.290.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:44.290.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:49.291.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:49.292.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:54.292.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:54.292.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:59.293.254 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:53:59.293.322 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:04.294.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:04.294.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:09.295.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:09.295.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:14.296.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:14.296.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:19.297.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:19.297.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:24.298.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:24.298.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:29.299.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:29.299.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:34.300.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:34.300.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:39.301.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:39.301.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:44.303.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:44.303.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:49.303.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:49.303.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:54.304.479 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:54.304.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:59.305.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:54:59.305.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:04.306.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:04.306.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:09.307.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:09.307.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:14.308.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:14.308.961 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:19.309.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:19.309.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:24.310.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:24.310.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:29.312.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:29.312.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:34.313.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:34.313.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:39.314.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:39.314.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:44.315.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:44.315.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:49.316.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:49.316.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:54.317.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:54.317.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:59.317.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:55:59.317.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:04.318.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:04.318.867 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:09.319.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:09.319.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:14.320.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:14.320.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:19.321.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:19.321.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:24.323.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:24.323.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:29.325.849 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:29.325.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:34.326.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:34.326.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:39.327.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:39.327.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:44.328.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:44.328.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:49.329.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:49.329.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:54.331.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:54.331.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:59.332.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:56:59.332.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:04.333.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:04.333.101 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:09.334.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:09.334.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:14.334.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:14.334.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:19.335.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:19.335.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:24.335.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:24.335.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:29.336.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:29.336.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:34.337.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:34.337.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:39.338.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:39.338.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:44.339.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:44.339.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:49.340.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:49.341.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:54.341.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:54.342.054 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:59.342.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:57:59.343.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:04.343.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:04.343.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:09.345.207 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:09.345.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:14.346.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:14.346.298 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:19.347.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:19.347.215 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:24.348.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:24.348.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:29.349.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:29.349.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:34.350.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:34.350.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:39.351.237 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:39.351.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:44.352.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:44.352.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:49.352.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:49.353.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:54.353.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:54.353.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:59.354.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:58:59.355.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:04.356.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:04.356.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:09.357.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:09.357.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:14.358.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:14.358.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:19.359.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:19.359.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:24.360.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:24.360.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:29.360.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:29.360.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:34.361.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:34.361.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:39.362.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:39.362.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:44.363.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:44.363.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:49.364.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:49.364.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:54.365.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:54.366.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:59.366.914 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-03:59:59.366.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:04.367.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:04.367.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:09.368.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:09.368.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:14.369.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:14.369.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:19.370.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:19.370.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:24.371.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:24.371.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:29.372.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:29.372.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:34.373.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:34.373.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:39.374.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:39.374.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:44.375.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:44.375.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:49.376.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:49.376.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:54.376.993 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:54.377.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:59.378.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:00:59.378.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:04.379.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:04.379.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:09.379.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:09.379.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:14.380.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:14.380.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:19.381.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:19.381.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:24.382.618 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:24.382.702 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:29.383.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:29.383.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:34.385.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:34.385.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:39.386.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:39.386.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:44.387.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:44.387.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:49.388.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:49.388.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:54.389.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:54.389.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:59.390.374 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:01:59.390.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:04.391.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:04.391.533 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:09.392.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:09.392.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:14.393.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:14.393.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:19.394.131 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:19.394.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:24.395.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:24.395.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:29.396.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:29.396.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:34.396.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:34.397.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:39.398.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:39.398.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:44.399.207 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:44.399.293 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:49.400.172 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:49.400.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:54.401.101 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:54.401.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:59.401.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:02:59.401.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:04.402.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:04.402.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:09.403.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:09.403.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:14.404.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:14.404.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:19.405.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:19.405.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:24.406.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:24.406.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:29.407.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:29.407.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:34.408.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:34.408.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:39.409.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:39.409.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:44.410.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:44.410.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:49.410.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:49.411.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:54.411.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:54.412.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:59.412.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:03:59.412.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:04.413.795 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:04.413.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:09.414.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:09.414.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:14.416.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:14.416.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:19.417.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:19.417.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:24.417.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:24.417.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:29.418.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:29.418.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:34.419.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:34.419.293 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:39.420.108 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:39.420.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:44.421.134 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:44.421.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:49.422.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:49.422.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:54.423.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:54.423.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:59.424.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:04:59.424.237 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:04.425.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:04.425.713 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:09.426.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:09.426.632 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:14.427.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:14.427.591 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:19.428.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:19.428.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:24.429.361 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:24.429.440 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:29.430.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:29.430.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:34.431.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:34.431.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:39.431.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:39.431.663 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:44.432.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:44.432.663 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:49.432.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:49.432.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:54.433.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:54.433.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:59.434.823 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:05:59.434.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:04.435.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:04.435.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:09.436.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:09.437.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:14.438.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:14.438.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:19.439.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:19.439.109 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:24.439.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:24.439.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:29.440.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:29.441.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:34.441.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:34.441.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:39.443.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:39.443.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:44.443.454 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:44.443.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:49.443.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:49.443.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:54.443.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:54.444.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:59.444.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:06:59.444.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:04.444.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:04.444.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:09.444.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:09.444.757 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:14.682.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:14.682.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:19.682.795 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:19.682.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:24.696.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:24.696.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:29.699.736 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:29.705.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:34.705.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:34.705.686 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:39.705.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:39.705.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:44.706.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:44.706.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:49.719.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:49.723.986 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:54.724.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:54.725.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:59.725.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:07:59.725.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:04.725.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:04.725.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:09.743.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:09.750.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:14.750.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:14.750.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:19.750.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:19.750.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:24.750.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:24.751.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:29.752.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:29.757.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:34.757.366 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:34.757.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:39.757.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:39.757.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:44.757.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:44.757.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:49.760.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:49.761.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:54.761.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:54.761.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:59.761.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:08:59.761.791 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:04.762.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:04.762.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:09.764.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:09.764.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:14.765.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:14.765.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:19.765.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:19.765.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:24.766.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:24.766.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:29.767.453 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:29.767.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:34.768.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:34.768.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:39.769.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:39.769.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:44.770.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:44.771.004 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:49.771.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:49.772.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:54.773.157 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:54.773.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:59.774.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:09:59.774.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:04.775.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:04.775.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:09.776.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:09.776.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:14.777.083 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:14.777.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:19.778.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:19.778.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:24.779.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:24.779.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:29.779.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:29.779.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:34.780.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:34.780.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:39.780.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:39.781.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:44.781.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:44.782.004 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:49.782.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:49.782.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:54.784.264 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:54.784.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:59.785.257 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:10:59.785.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:04.786.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:04.786.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:09.787.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:09.787.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:14.787.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:14.787.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:19.788.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:19.788.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:24.788.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:24.789.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:29.789.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:29.789.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:34.791.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:34.791.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:39.792.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:39.792.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:44.793.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:44.793.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:49.793.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:49.793.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:54.794.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:54.794.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:59.795.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:11:59.795.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:04.797.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:04.797.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:09.798.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:09.798.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:14.799.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:14.799.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:19.800.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:19.800.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:24.800.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:24.800.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:29.801.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:29.801.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:34.803.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:34.803.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:39.804.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:39.804.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:44.805.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:44.805.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:49.805.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:49.805.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:54.806.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:54.806.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:59.807.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:12:59.807.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:04.808.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:04.808.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:09.810.058 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:09.810.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:14.811.031 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:14.811.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:19.812.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:19.812.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:24.812.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:24.812.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:29.813.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:29.813.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:34.814.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:34.814.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:39.815.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:39.815.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:44.816.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:44.816.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:49.817.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:49.817.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:54.818.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:54.818.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:59.819.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:13:59.820.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:04.820.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:04.820.243 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:09.821.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:09.821.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:14.821.438 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:14.821.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:19.822.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:19.822.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:24.823.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:24.823.538 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:29.824.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:29.824.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:34.825.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:34.825.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:39.826.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:39.826.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:44.827.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:44.827.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:49.828.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:49.828.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:54.829.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:54.829.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:59.830.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:14:59.830.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:04.831.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:04.831.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:09.832.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:09.832.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:14.833.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:14.833.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:19.834.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:19.834.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:24.835.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:24.835.595 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:29.836.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:29.836.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:34.837.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:34.837.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:39.838.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:39.838.536 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:44.839.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:44.839.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:49.840.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:49.840.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:54.841.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:54.841.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:59.843.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:15:59.843.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:04.844.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:04.844.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:09.845.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:09.845.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:14.845.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:14.846.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:19.846.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:19.846.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:24.847.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:24.847.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:29.848.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:29.848.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:34.849.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:34.849.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:39.850.843 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:39.850.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:44.851.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:44.851.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:49.852.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:49.853.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:54.854.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:54.854.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:59.855.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:16:59.855.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:04.855.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:04.855.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:09.856.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:09.856.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:14.856.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:14.857.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:19.857.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:19.858.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:24.858.732 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:24.858.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:29.859.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:29.859.078 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:34.860.033 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:34.860.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:39.860.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:39.860.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:44.860.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:44.860.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:49.861.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:49.861.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:54.862.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:54.862.727 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:59.863.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:17:59.863.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:04.864.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:04.864.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:09.866.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:09.866.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:14.867.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:14.867.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:19.867.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:19.867.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:24.868.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:24.868.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:29.869.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:29.869.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:34.870.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:34.870.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:39.871.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:39.871.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:44.872.630 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:44.872.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:49.873.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:49.873.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:54.873.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:54.874.049 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:59.875.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:18:59.875.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:04.876.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:04.876.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:09.877.199 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:09.877.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:14.878.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:14.878.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:19.879.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:19.879.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:24.880.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:24.880.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:29.880.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:29.880.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:34.881.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:34.881.369 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:39.882.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:39.882.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:44.883.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:44.884.032 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:49.884.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:49.884.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:54.885.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:54.885.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:59.886.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:19:59.886.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:04.886.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:04.886.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:09.887.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:09.887.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:14.887.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:14.888.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:19.889.378 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:19.889.454 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:24.890.342 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:24.890.422 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:29.891.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:29.891.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:34.891.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:34.891.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:39.891.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:39.891.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:44.893.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:44.893.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:49.894.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:49.894.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:54.895.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:54.895.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:59.896.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:20:59.896.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:04.897.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:04.897.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:09.897.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:09.897.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:14.897.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:14.898.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:19.898.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:19.898.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:24.899.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:24.899.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:29.900.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:29.900.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:34.901.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:34.901.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:39.902.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:39.902.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:44.902.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:44.902.889 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:49.903.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:49.903.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:54.904.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:54.904.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:59.906.369 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:21:59.906.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:04.906.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:04.906.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:09.907.669 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:09.907.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:14.908.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:14.908.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:19.909.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:19.909.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:24.910.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:24.910.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:29.911.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:29.911.875 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:34.912.050 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:34.912.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:39.913.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:39.913.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:44.914.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:44.914.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:49.915.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:49.915.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:54.916.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:54.916.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:59.916.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:22:59.917.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:04.917.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:04.918.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:09.918.234 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:09.918.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:14.919.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:14.919.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:19.919.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:19.919.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:24.920.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:24.920.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:29.920.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:29.920.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:34.921.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:34.921.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:39.923.059 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:39.923.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:44.924.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:44.924.101 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:49.924.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:49.925.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:54.925.297 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:54.925.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:59.926.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:23:59.926.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:04.927.381 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:04.927.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:09.927.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:09.927.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:14.929.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:14.929.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:19.930.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:19.930.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:24.930.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:24.931.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:29.931.852 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:29.931.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:34.932.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:34.933.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:39.933.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:39.934.103 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:44.934.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:44.934.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:49.935.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:49.935.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:54.936.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:54.936.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:59.937.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:24:59.937.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:04.938.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:04.938.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:09.939.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:09.939.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:14.940.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:14.940.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:19.941.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:19.941.464 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:24.942.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:24.942.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:29.943.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:29.944.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:34.945.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:34.945.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:39.946.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:39.946.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:44.946.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:44.947.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:49.948.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:49.948.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:54.948.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:54.948.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:59.949.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:25:59.949.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:04.950.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:04.950.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:09.951.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:09.951.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:14.951.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:14.951.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:19.952.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:19.953.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:24.953.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:24.954.064 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:29.954.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:29.954.871 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:34.955.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:34.955.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:39.957.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:39.957.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:44.957.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:44.958.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:49.958.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:49.958.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:54.959.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:54.959.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:59.959.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:26:59.959.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:04.959.572 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:04.959.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:09.961.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:09.961.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:14.962.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:14.962.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:19.962.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:19.962.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:24.963.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:24.963.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:29.964.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:29.964.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:34.964.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:34.964.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:39.966.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:39.966.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:44.967.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:44.967.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:49.967.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:49.967.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:54.968.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:54.968.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:59.969.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:27:59.969.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:04.969.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:04.969.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:09.969.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:09.970.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:14.970.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:14.970.327 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:19.971.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:19.971.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:24.971.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:24.972.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:29.972.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:29.972.868 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:34.973.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:34.973.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:39.974.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:39.974.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:44.974.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:44.974.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:49.975.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:49.975.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:54.977.297 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:54.977.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:59.978.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:28:59.978.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:04.978.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:04.978.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:09.979.693 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:09.979.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:14.980.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:14.980.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:19.980.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:19.980.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:24.982.361 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:24.982.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:29.983.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:29.983.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:34.983.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:34.984.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:39.984.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:39.984.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:44.985.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:44.985.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:49.985.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:49.986.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:54.987.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:54.987.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:59.988.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:29:59.988.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:04.989.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:04.989.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:09.990.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:09.990.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:14.991.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:14.991.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:19.991.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:19.991.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:24.993.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:24.993.440 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:29.993.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:29.993.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:34.994.568 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:34.994.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:39.995.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:39.995.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:44.996.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:44.996.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:49.996.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:49.996.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:54.996.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:54.996.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:59.996.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:30:59.997.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:04.997.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:04.997.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:09.997.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:09.997.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:14.997.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:14.997.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:19.998.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:19.998.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:24.998.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:24.998.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:29.999.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:29.999.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:34.999.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:35.000.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:40.000.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:40.000.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:45.000.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:45.000.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:50.001.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:50.001.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:55.001.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:31:55.001.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:00.001.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:00.001.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:05.001.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:05.001.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:10.002.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:10.002.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:15.002.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:15.002.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:20.002.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:20.002.705 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:25.002.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:25.002.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:30.003.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:30.003.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:35.003.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:35.003.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:40.003.602 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:40.003.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:45.003.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:45.003.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:50.004.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:50.004.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:55.005.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:32:55.005.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:00.005.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:00.005.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:05.005.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:05.005.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:10.005.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:10.005.780 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:15.005.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:15.006.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:20.006.172 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:20.006.243 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:25.006.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:25.006.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:30.006.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:30.006.713 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:35.006.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:35.007.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:40.007.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:40.007.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:45.007.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:45.007.459 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:50.007.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:50.007.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:55.007.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:33:55.007.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:00.008.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:00.008.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:05.008.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:05.008.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:10.008.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:10.008.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:15.008.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:15.008.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:20.008.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:20.009.049 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:25.009.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:25.009.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:30.009.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:30.009.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:35.009.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:35.009.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:40.009.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:40.010.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:45.010.185 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:45.010.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:50.010.438 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:50.010.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:55.010.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:34:55.010.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:00.010.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:00.010.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:05.011.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:05.011.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:10.011.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:10.012.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:15.012.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:15.012.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:20.013.630 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:20.013.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:25.013.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:25.013.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:30.014.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:30.014.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:35.014.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:35.014.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:40.014.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:40.014.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:45.014.815 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:45.014.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:50.015.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:50.015.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:55.015.284 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:35:55.015.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:00.015.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:00.015.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:05.015.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:05.015.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:10.015.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:10.016.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:15.016.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:15.016.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:20.016.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:20.016.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:25.016.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:25.016.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:30.016.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:30.016.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:35.017.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:35.017.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:40.018.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:40.018.102 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:45.018.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:45.018.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:50.018.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:50.018.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:55.018.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:36:55.018.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:00.018.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:00.019.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:05.019.158 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:05.019.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:10.019.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:10.019.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:15.019.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:15.019.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:20.019.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:20.019.943 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:25.020.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:25.020.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:30.020.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:30.020.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:35.020.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:35.020.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:40.020.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:40.020.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:45.021.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:45.021.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:50.021.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:50.021.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:55.021.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:37:55.021.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:00.021.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:00.021.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:05.021.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:05.022.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:10.022.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:10.022.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:15.022.438 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:15.022.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:20.022.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:20.022.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:25.022.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:25.022.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:30.023.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:30.023.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:35.023.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:35.023.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:40.023.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:40.023.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:45.023.830 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:45.023.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:50.024.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:50.024.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:55.024.264 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:38:55.024.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:00.024.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:00.024.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:05.024.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:05.024.812 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:10.024.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:10.025.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:15.025.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:15.025.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:20.025.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:20.025.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:25.025.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:25.025.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:30.025.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:30.025.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:35.026.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:35.026.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:40.026.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:40.026.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:45.026.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:45.026.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:50.026.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:50.026.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:55.027.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:39:55.027.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:00.027.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:00.027.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:05.027.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:05.028.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:10.028.284 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:10.028.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:15.028.516 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:15.028.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:20.028.752 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:20.028.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:25.028.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:25.029.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:30.029.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:30.029.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:35.029.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:35.029.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:40.029.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:40.029.747 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:45.029.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:45.029.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:50.740.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:50.740.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:55.786.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:40:55.788.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:00.788.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:00.788.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:05.802.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:05.803.733 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:10.803.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:10.803.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:15.804.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:15.805.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:20.805.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:20.805.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:25.805.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:25.809.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:30.809.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:30.809.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:35.809.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:35.812.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:40.813.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:40.813.127 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:45.835.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:45.839.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:50.840.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:50.840.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:55.840.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:41:55.840.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:00.840.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:00.840.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:05.871.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:05.873.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:10.874.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:10.875.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:15.876.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:15.877.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:20.877.710 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:20.877.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:25.877.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:25.877.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:30.878.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:30.878.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:35.878.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:35.878.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:40.878.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:40.878.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:45.878.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:45.879.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:50.879.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:50.879.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:55.879.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:42:55.879.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:00.879.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:00.879.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:05.879.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:05.879.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:10.880.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:10.880.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:15.881.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:15.881.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:20.881.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:20.881.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:25.882.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:25.882.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:30.882.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:30.882.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:35.882.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:35.882.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:40.882.905 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:40.882.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:45.883.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:45.883.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:50.883.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:50.883.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:55.883.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:43:55.883.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:00.883.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:00.883.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:05.884.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:05.884.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:10.884.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:10.884.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:15.884.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:15.884.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:20.884.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:20.884.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:25.885.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:25.885.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:30.885.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:30.885.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:35.885.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:35.885.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:40.885.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:40.885.872 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:45.886.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:45.886.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:50.886.264 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:50.886.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:55.886.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:44:55.886.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:00.886.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:00.887.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:05.887.509 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:05.887.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:10.887.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:10.887.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:15.888.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:15.889.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:20.889.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:20.889.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:25.889.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:25.889.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:30.890.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:30.890.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:35.890.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:35.890.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:40.890.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:40.890.636 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:45.890.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:45.890.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:50.891.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:50.891.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:55.891.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:45:55.891.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:00.891.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:00.891.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:05.891.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:05.891.818 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:10.892.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:10.892.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:15.892.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:15.892.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:20.893.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:20.893.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:25.893.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:25.893.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:30.893.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:30.893.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:35.893.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:35.893.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:40.894.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:40.894.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:45.894.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:45.894.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:50.895.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:50.895.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:55.895.241 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:46:55.895.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:00.895.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:00.895.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:05.895.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:05.895.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:10.895.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:10.895.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:15.896.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:15.896.215 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:20.896.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:20.896.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:25.896.602 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:25.896.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:30.896.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:30.896.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:35.897.079 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:35.897.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:40.897.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:40.897.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:45.897.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:45.897.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:50.897.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:50.897.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:55.898.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:47:55.898.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:00.898.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:00.898.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:05.898.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:05.898.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:10.898.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:10.898.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:15.898.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:15.899.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:20.899.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:20.899.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:25.899.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:25.899.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:30.899.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:30.899.742 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:35.899.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:35.899.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:40.900.126 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:40.900.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:45.900.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:45.900.448 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:50.900.606 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:50.900.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:55.900.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:48:55.900.920 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:00.901.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:00.901.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:05.901.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:05.901.369 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:10.901.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:10.901.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:15.901.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:15.901.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:20.902.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:20.902.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:25.902.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:25.902.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:30.902.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:30.902.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:35.902.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:35.902.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:40.902.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:40.903.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:45.903.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:45.903.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:50.904.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:50.904.070 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:55.904.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:49:55.904.320 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:00.904.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:00.904.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:05.904.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:05.904.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:10.905.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:10.905.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:15.905.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:15.905.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:20.905.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:20.906.044 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:25.906.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:25.906.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:30.906.457 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:30.906.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:35.907.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:35.908.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:40.908.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:40.908.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:45.908.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:45.908.459 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:50.908.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:50.908.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:55.908.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:50:55.908.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:00.909.595 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:00.909.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:05.909.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:05.909.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:10.910.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:10.910.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:15.910.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:15.910.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:20.910.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:20.910.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:25.910.910 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:25.911.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:30.911.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:30.911.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:35.911.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:35.911.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:40.911.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:40.911.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:45.911.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:45.912.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:50.912.163 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:50.912.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:55.912.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:51:55.912.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:00.912.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:00.913.246 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:05.913.406 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:05.913.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:10.913.678 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:10.913.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:15.913.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:15.913.983 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:20.914.133 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:20.914.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:25.914.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:25.914.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:30.914.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:30.914.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:35.914.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:35.914.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:40.915.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:40.915.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:45.915.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:45.915.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:50.915.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:50.915.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:55.915.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:52:55.915.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:00.915.958 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:00.916.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:05.916.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:05.916.246 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:10.916.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:10.916.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:15.917.234 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:15.917.308 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:20.917.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:20.917.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:25.917.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:25.917.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:30.917.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:30.918.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:35.918.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:35.918.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:40.918.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:40.919.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:45.919.243 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:45.919.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:50.919.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:50.919.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:55.919.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:53:55.919.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:00.919.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:00.919.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:05.920.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:05.920.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:10.920.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:10.920.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:15.920.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:15.920.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:20.920.843 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:20.920.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:25.921.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:25.921.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:30.921.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:30.921.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:35.921.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:35.921.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:40.921.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:40.921.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:45.922.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:45.922.646 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:50.922.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:50.922.894 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:55.923.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:54:55.923.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:00.924.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:00.924.503 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:05.924.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:05.924.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:10.924.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:10.924.927 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:15.925.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:15.925.162 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:20.925.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:20.925.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:25.925.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:25.925.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:30.925.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:30.926.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:35.926.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:35.926.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:40.926.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:40.926.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:45.927.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:45.927.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:50.927.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:50.927.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:55.927.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:55:55.927.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:00.927.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:00.927.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:05.928.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:05.928.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:10.928.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:10.928.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:15.928.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:15.928.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:20.928.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:20.928.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:25.928.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:25.929.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:30.929.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:30.929.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:35.929.419 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:35.929.502 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:40.929.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:40.929.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:45.929.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:45.929.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:50.930.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:50.930.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:55.930.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:56:55.930.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:00.930.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:00.930.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:05.931.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:05.931.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:10.931.630 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:10.931.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:15.931.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:15.931.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:20.932.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:20.932.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:25.932.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:25.932.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:30.932.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:30.932.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:35.932.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:35.932.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:40.933.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:40.933.135 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:45.933.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:45.933.445 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:50.933.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:50.933.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:55.933.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:57:55.933.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:00.934.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:00.934.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:05.934.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:05.934.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:10.934.562 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:10.934.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:15.934.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:15.934.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:20.935.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:20.935.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:25.935.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:25.935.402 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:30.935.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:30.935.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:35.935.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:35.935.889 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:40.936.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:40.936.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:45.936.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:45.936.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:50.936.566 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:50.936.625 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:55.937.348 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:58:55.937.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:00.937.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:00.937.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:05.937.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:05.937.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:10.938.075 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:10.938.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:15.938.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:15.938.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:20.938.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:20.938.625 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:25.938.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:25.938.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:30.939.501 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:30.939.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:35.939.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:35.939.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:40.939.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:40.940.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:45.940.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:45.940.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:50.940.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:50.940.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:55.940.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-04:59:55.940.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:00.940.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:00.941.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:05.941.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:05.941.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:10.941.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:10.941.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:15.941.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:15.941.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:20.941.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:20.942.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:25.942.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:25.942.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:30.942.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:30.942.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:35.942.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:35.942.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:40.942.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:40.942.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:45.943.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:45.943.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:50.943.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:50.943.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:55.943.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:00:55.943.723 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:00.943.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:00.943.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:05.944.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:05.944.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:10.944.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:10.944.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:15.944.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:15.944.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:20.944.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:20.944.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:25.945.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:25.945.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:30.945.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:30.945.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:35.945.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:35.945.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:40.945.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:40.945.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:45.945.921 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:45.946.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:50.946.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:50.946.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:55.946.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:01:55.946.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:00.946.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:00.946.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:05.946.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:05.946.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:10.947.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:10.947.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:15.947.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:15.947.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:20.947.606 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:20.947.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:25.947.843 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:25.947.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:30.948.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:30.948.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:35.948.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:35.948.402 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:40.948.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:40.948.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:45.948.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:45.948.896 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:50.949.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:50.949.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:55.949.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:02:55.949.346 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:00.949.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:00.949.595 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:05.949.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:05.949.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:10.949.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:10.950.064 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:15.950.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:15.950.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:20.951.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:20.951.136 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:25.951.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:25.951.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:30.951.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:30.951.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:35.951.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:35.951.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:40.952.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:40.952.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:45.952.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:45.952.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:50.952.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:50.952.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:55.952.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:03:55.952.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:00.952.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:00.953.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:05.953.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:05.953.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:10.953.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:10.953.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:15.953.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:15.953.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:20.954.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:20.954.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:25.954.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:25.954.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:30.955.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:30.955.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:35.955.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:35.955.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:40.955.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:40.955.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:45.955.849 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:45.955.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:50.956.079 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:50.956.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:55.956.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:04:55.956.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:00.956.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:00.956.703 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:05.956.868 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:05.956.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:10.957.109 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:10.957.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:15.957.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:15.957.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:20.957.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:20.957.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:25.957.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:25.957.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:30.958.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:30.958.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:35.958.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:35.958.401 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:40.958.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:40.958.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:45.958.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:45.958.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:50.959.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:50.959.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:55.959.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:05:55.959.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:00.959.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:00.959.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:05.959.738 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:05.959.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:10.959.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:10.960.058 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:15.960.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:15.960.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:20.960.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:20.960.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:25.960.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:25.960.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:30.960.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:30.960.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:35.961.108 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:35.961.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:40.961.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:40.961.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:45.961.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:45.961.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:50.961.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:50.961.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:55.962.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:06:55.962.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:00.962.263 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:00.962.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:05.962.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:05.962.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:10.962.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:10.962.775 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:15.962.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:15.963.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:20.963.192 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:20.963.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:25.963.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:25.963.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:30.963.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:30.963.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:35.963.905 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:35.963.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:40.964.131 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:40.964.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:45.964.362 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:45.964.425 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:50.964.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:50.964.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:55.964.849 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:07:55.964.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:00.965.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:00.965.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:05.965.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:05.965.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:10.965.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:10.965.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:15.965.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:15.965.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:20.966.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:20.966.101 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:25.966.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:25.966.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:30.966.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:30.966.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:35.966.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:35.966.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:40.966.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:40.967.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:45.967.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:45.967.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:50.967.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:50.968.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:55.968.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:08:55.968.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:00.968.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:00.968.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:05.968.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:05.968.703 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:10.968.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:10.968.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:15.969.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:15.969.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:20.969.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:20.969.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:25.970.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:25.970.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:30.970.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:30.970.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:35.970.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:35.970.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:40.970.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:40.970.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:45.972.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:45.972.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:50.972.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:50.972.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:55.973.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:09:55.973.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:00.973.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:00.973.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:05.973.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:05.973.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:10.974.573 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:10.974.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:15.974.816 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:15.974.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:20.975.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:20.975.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:25.975.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:25.975.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:30.975.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:30.975.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:35.975.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:35.975.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:40.975.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:40.976.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:45.976.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:45.976.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:50.976.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:50.976.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:55.976.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:10:55.976.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:00.976.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:00.977.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:05.977.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:05.977.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:10.977.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:10.977.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:15.977.673 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:15.977.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:20.977.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:20.977.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:25.978.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:25.978.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:30.978.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:30.978.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:35.978.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:35.978.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:40.978.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:40.978.943 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:45.979.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:45.979.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:50.979.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:50.979.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:55.980.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:11:55.980.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:00.980.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:00.980.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:05.980.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:05.980.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:10.980.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:10.980.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:15.981.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:15.981.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:20.981.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:20.981.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:25.981.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:25.981.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:30.981.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:30.981.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:35.982.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:35.982.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:40.982.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:40.982.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:45.982.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:45.982.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:50.982.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:50.982.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:55.983.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:12:55.983.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:00.983.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:00.984.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:05.984.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:05.984.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:10.984.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:10.984.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:15.984.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:15.984.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:20.985.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:20.985.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:25.985.732 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:25.985.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:30.985.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:30.986.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:35.986.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:35.986.780 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:40.986.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:40.987.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:45.987.214 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:45.987.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:50.987.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:50.987.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:55.987.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:13:55.987.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:00.987.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:00.987.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:05.988.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:05.988.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:10.988.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:10.988.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:15.989.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:15.989.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:20.989.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:20.990.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:25.990.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:25.990.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:30.990.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:30.991.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:35.991.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:35.991.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:40.995.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:41.821.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:46.821.237 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:46.822.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:51.822.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:51.822.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:56.822.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:14:56.822.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:01.844.739 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:01.844.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:06.847.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:06.852.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:11.852.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:11.856.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:16.856.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:16.857.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:21.857.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:21.866.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:26.867.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:26.867.214 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:31.867.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:31.867.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:36.867.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:36.867.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:41.895.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:41.902.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:46.902.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:46.902.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:51.902.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:51.902.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:56.903.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:15:56.903.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:01.923.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:01.923.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:06.923.569 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:06.923.646 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:11.923.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:11.923.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:16.924.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:16.924.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:21.924.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:21.924.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:26.924.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:26.924.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:31.924.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:31.924.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:36.925.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:36.925.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:41.925.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:41.925.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:46.925.523 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:46.925.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:51.925.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:51.925.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:56.925.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:16:56.926.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:01.926.214 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:01.926.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:06.926.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:06.926.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:11.926.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:11.926.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:16.927.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:16.927.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:21.927.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:21.927.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:26.927.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:26.927.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:31.927.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:31.927.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:36.928.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:36.928.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:41.928.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:41.928.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:46.928.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:46.928.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:51.928.693 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:51.928.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:56.928.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:17:56.929.044 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:01.929.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:01.929.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:06.929.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:06.929.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:11.929.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:11.929.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:16.929.905 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:16.929.966 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:21.930.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:21.930.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:26.930.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:26.930.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:31.930.568 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:31.930.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:36.930.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:36.930.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:41.931.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:41.931.134 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:46.931.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:46.931.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:51.931.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:51.931.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:56.931.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:18:56.931.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:01.932.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:01.932.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:06.932.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:06.932.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:11.932.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:11.932.655 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:16.932.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:16.932.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:21.933.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:21.933.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:26.933.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:26.933.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:31.933.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:31.933.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:36.933.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:36.933.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:41.934.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:41.934.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:46.934.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:46.934.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:51.934.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:51.934.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:56.934.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:19:56.934.982 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:01.935.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:01.935.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:06.935.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:06.935.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:11.935.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:11.935.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:16.935.899 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:16.935.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:21.936.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:21.936.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:26.936.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:26.936.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:31.936.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:31.936.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:36.936.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:36.936.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:41.937.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:41.937.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:46.937.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:46.937.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:51.937.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:51.937.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:56.937.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:20:56.937.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:01.938.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:01.938.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:06.938.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:06.938.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:11.938.582 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:11.938.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:16.938.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:16.938.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:21.939.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:21.939.102 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:26.939.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:26.939.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:31.939.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:31.939.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:36.939.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:36.939.783 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:41.939.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:41.940.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:46.940.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:46.940.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:51.940.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:51.940.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:56.940.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:21:56.940.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:01.940.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:01.940.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:06.941.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:06.941.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:11.941.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:11.941.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:16.941.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:16.941.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:21.941.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:21.941.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:26.942.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:26.942.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:31.942.297 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:31.942.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:36.942.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:36.942.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:41.942.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:41.942.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:46.943.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:46.943.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:51.943.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:51.943.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:56.943.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:22:56.943.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:01.943.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:01.943.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:06.943.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:06.944.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:11.944.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:11.944.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:16.944.419 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:16.944.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:21.944.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:21.944.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:26.944.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:26.944.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:31.945.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:31.945.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:36.945.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:36.945.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:41.946.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:41.946.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:46.946.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:46.947.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:51.947.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:51.947.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:56.947.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:23:56.947.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:01.947.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:01.947.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:06.947.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:06.947.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:11.948.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:11.948.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:16.948.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:16.948.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:21.948.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:21.948.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:26.948.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:26.948.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:31.949.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:31.949.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:36.949.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:36.949.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:41.949.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:41.949.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:46.949.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:46.949.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:51.949.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:51.950.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:56.950.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:24:56.950.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:01.950.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:01.950.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:06.950.743 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:06.950.812 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:11.950.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:11.951.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:16.951.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:16.951.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:21.951.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:21.951.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:26.951.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:26.951.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:31.951.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:31.952.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:36.952.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:36.952.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:41.952.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:41.952.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:46.952.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:46.952.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:51.952.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:51.952.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:56.953.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:25:56.953.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:01.953.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:01.953.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:06.953.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:06.953.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:11.953.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:11.953.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:16.954.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:16.954.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:21.954.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:21.955.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:26.955.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:26.955.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:31.955.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:31.955.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:36.955.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:36.955.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:41.956.058 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:41.956.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:46.956.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:46.956.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:51.956.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:51.956.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:56.956.766 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:26:56.956.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:01.956.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:01.957.044 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:06.957.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:06.957.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:11.957.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:11.957.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:16.957.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:16.957.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:21.957.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:21.957.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:26.958.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:26.958.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:31.958.383 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:31.958.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:36.958.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:36.958.703 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:41.958.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:41.958.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:46.959.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:46.959.233 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:51.959.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:51.959.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:56.959.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:27:56.959.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:01.959.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:01.959.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:06.960.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:06.960.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:11.960.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:11.960.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:16.960.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:16.960.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:21.960.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:21.960.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:26.961.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:26.961.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:31.961.284 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:31.961.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:36.961.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:36.961.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:41.961.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:41.961.814 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:46.961.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:46.962.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:51.962.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:51.962.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:56.962.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:28:56.962.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:01.962.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:01.962.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:06.962.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:06.963.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:11.963.199 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:11.963.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:16.963.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:16.963.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:21.963.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:21.963.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:26.963.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:26.963.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:31.964.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:31.964.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:36.964.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:36.964.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:41.964.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:41.964.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:46.964.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:46.964.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:51.965.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:51.965.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:56.965.360 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:29:56.965.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:01.965.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:01.965.679 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:06.965.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:06.965.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:11.966.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:11.966.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:16.966.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:16.966.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:21.966.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:21.966.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:26.966.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:26.966.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:31.967.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:31.967.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:36.967.280 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:36.967.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:41.967.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:41.967.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:46.967.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:46.967.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:51.967.932 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:51.967.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:56.968.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:30:56.968.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:01.968.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:01.968.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:06.968.627 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:06.968.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:11.968.861 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:11.968.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:16.969.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:16.969.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:21.969.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:21.969.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:26.970.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:26.970.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:31.970.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:31.970.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:36.970.608 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:36.970.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:41.970.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:41.970.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:46.971.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:46.971.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:51.971.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:51.971.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:56.971.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:31:56.971.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:01.971.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:01.971.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:06.972.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:06.972.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:11.972.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:11.972.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:16.972.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:16.972.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:21.972.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:21.972.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:26.972.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:26.973.005 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:31.973.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:31.973.210 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:36.973.362 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:36.973.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:41.973.589 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:41.973.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:46.973.877 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:46.973.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:51.974.116 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:51.974.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:56.974.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:32:56.974.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:01.974.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:01.974.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:06.974.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:06.974.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:11.975.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:11.975.110 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:16.975.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:16.975.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:21.975.534 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:21.975.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:26.975.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:26.975.871 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:31.976.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:31.976.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:36.976.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:36.976.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:41.976.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:41.976.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:46.976.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:46.976.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:51.977.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:51.977.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:56.977.246 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:33:56.977.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:01.977.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:01.977.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:06.977.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:06.977.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:11.977.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:11.978.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:16.978.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:16.978.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:21.978.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:21.978.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:26.978.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:26.978.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:31.978.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:31.978.982 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:36.979.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:36.979.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:41.979.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:41.979.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:46.979.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:46.979.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:51.979.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:51.979.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:56.980.134 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:34:56.980.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:01.980.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:01.980.454 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:06.980.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:06.980.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:11.980.877 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:11.980.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:16.981.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:16.981.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:21.981.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:21.981.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:26.981.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:26.981.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:31.981.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:31.981.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:36.982.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:36.982.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:41.982.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:41.982.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:46.982.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:46.982.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:51.982.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:51.982.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:56.983.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:35:56.983.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:01.983.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:01.983.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:06.983.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:06.983.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:11.983.707 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:11.983.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:16.984.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:16.984.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:21.984.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:21.984.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:26.984.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:26.984.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:31.985.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:31.985.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:36.985.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:36.985.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:41.986.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:41.986.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:46.986.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:46.986.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:51.986.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:51.986.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:56.986.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:36:56.987.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:01.987.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:01.987.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:06.987.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:06.987.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:11.987.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:11.987.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:16.987.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:16.987.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:21.988.101 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:21.988.171 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:26.988.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:26.988.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:31.988.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:31.988.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:36.988.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:36.988.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:41.989.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:41.989.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:46.989.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:46.989.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:51.989.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:51.989.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:56.989.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:37:56.989.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:01.990.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:01.990.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:06.990.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:06.990.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:11.990.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:11.990.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:16.990.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:16.990.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:21.991.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:21.991.070 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:26.991.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:26.991.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:31.991.501 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:31.991.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:36.991.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:36.991.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:41.991.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:41.992.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:46.992.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:46.992.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:51.992.390 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:51.992.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:56.992.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:38:56.992.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:01.992.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:01.992.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:06.993.079 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:06.993.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:11.993.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:11.993.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:16.993.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:16.993.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:21.993.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:21.993.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:26.994.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:26.994.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:31.994.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:31.994.300 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:36.994.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:36.994.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:41.994.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:41.994.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:46.994.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:46.995.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:51.995.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:51.995.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:56.995.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:39:56.995.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:01.995.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:01.995.676 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:06.995.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:06.995.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:11.996.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:11.996.134 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:16.996.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:16.996.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:21.996.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:21.996.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:26.996.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:26.996.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:31.997.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:31.997.110 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:36.997.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:36.997.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:41.997.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:41.997.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:46.997.739 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:46.997.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:51.997.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:51.998.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:56.998.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:40:56.998.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:01.998.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:01.998.529 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:06.998.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:06.998.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:11.998.951 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:11.999.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:16.999.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:16.999.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:21.999.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:21.999.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:26.999.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:26.999.646 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:31.999.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:31.999.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:37.000.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:37.000.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:42.000.294 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:42.000.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:47.000.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:47.000.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:52.000.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:52.000.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:57.001.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:41:57.001.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:02.001.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:02.001.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:07.001.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:07.001.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:12.001.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:12.001.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:17.001.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:17.002.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:22.002.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:22.002.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:27.002.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:27.002.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:32.002.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:32.002.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:37.002.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:37.003.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:42.003.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:42.003.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:47.003.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:47.003.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:52.003.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:52.003.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:57.003.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:42:57.003.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:02.004.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:02.004.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:07.004.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:07.004.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:12.004.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:12.004.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:17.004.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:17.004.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:22.005.087 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:22.005.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:27.005.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:27.005.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:32.005.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:32.005.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:37.005.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:37.005.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:42.006.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:42.006.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:47.006.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:47.006.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:52.006.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:52.006.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:57.006.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:43:57.006.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:02.006.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:02.007.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:07.007.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:07.007.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:12.007.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:12.007.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:17.007.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:17.007.749 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:22.007.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:22.007.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:27.008.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:27.008.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:32.008.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:32.008.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:37.008.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:37.008.705 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:42.008.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:42.008.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:47.009.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:47.009.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:52.009.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:52.009.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:57.009.531 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:44:57.009.595 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:02.009.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:02.009.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:07.010.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:07.010.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:12.010.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:12.010.322 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:17.010.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:17.010.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:22.010.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:22.010.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:27.010.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:27.011.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:32.011.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:32.011.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:37.011.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:37.011.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:42.011.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:42.011.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:47.011.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:47.012.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:52.012.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:52.012.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:57.012.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:45:57.012.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:02.012.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:02.012.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:07.012.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:07.012.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:12.013.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:12.013.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:17.013.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:17.013.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:22.013.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:22.013.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:27.013.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:27.013.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:32.014.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:32.014.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:37.014.296 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:37.014.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:42.014.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:42.014.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:47.014.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:47.014.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:52.015.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:52.015.078 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:57.015.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:46:57.015.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:02.015.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:02.015.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:07.015.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:07.015.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:12.015.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:12.015.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:17.016.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:17.016.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:22.016.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:22.016.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:27.016.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:27.016.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:32.016.884 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:32.017.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:37.018.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:37.018.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:42.018.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:42.018.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:47.018.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:47.019.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:52.020.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:52.020.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:57.020.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:47:57.020.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:02.020.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:02.022.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:07.022.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:07.027.401 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:12.027.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:12.027.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:17.027.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:17.031.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:22.031.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:22.033.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:27.033.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:27.033.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:32.033.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:32.033.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:37.034.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:37.034.814 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:42.034.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:42.035.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:47.035.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:47.036.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:52.036.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:52.036.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:57.041.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:48:57.041.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:02.041.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:02.041.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:07.042.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:07.050.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:12.050.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:12.050.300 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:17.067.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:17.067.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:22.069.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:22.069.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:27.069.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:27.069.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:32.069.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:32.069.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:37.072.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:37.072.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:42.074.221 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:42.074.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:47.076.566 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:47.076.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:52.076.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:52.076.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:57.077.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:49:57.077.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:02.077.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:02.077.346 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:07.077.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:07.077.591 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:12.077.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:12.077.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:17.078.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:17.078.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:22.078.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:22.078.363 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:27.078.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:27.078.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:32.078.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:32.078.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:37.079.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:37.079.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:42.079.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:42.079.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:47.079.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:47.079.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:52.079.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:52.079.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:57.079.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:50:57.079.980 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:02.080.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:02.080.210 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:07.080.378 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:07.080.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:12.080.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:12.080.671 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:17.080.823 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:17.080.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:22.081.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:22.081.094 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:27.081.257 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:27.081.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:32.081.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:32.081.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:37.081.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:37.081.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:42.081.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:42.082.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:47.082.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:47.082.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:52.082.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:52.082.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:57.082.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:51:57.082.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:02.082.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:02.082.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:07.083.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:07.083.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:12.083.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:12.083.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:17.083.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:17.083.543 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:22.083.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:22.083.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:27.083.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:27.084.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:32.084.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:32.084.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:37.084.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:37.084.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:42.084.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:42.084.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:47.084.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:47.084.896 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:52.085.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:52.085.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:57.085.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:52:57.085.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:02.085.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:02.085.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:07.085.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:07.085.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:12.085.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:12.086.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:17.086.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:17.086.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:22.086.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:22.086.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:27.086.618 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:27.086.675 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:32.086.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:32.086.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:37.087.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:37.087.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:42.087.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:42.087.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:47.087.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:47.087.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:52.087.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:52.087.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:57.087.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:53:57.088.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:02.088.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:02.088.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:07.088.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:07.088.471 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:12.088.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:12.088.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:17.088.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:17.088.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:22.089.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:22.089.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:27.089.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:27.089.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:32.089.573 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:32.089.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:37.089.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:37.089.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:42.090.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:42.090.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:47.090.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:47.090.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:52.090.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:52.090.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:57.090.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:54:57.090.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:02.090.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:02.091.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:07.091.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:07.091.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:12.091.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:12.091.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:17.092.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:17.092.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:22.092.582 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:22.092.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:27.092.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:27.092.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:32.093.059 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:32.093.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:37.093.293 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:37.093.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:42.093.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:42.093.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:47.093.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:47.093.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:52.094.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:52.094.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:57.094.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:55:57.094.324 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:02.094.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:02.094.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:07.094.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:07.094.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:12.094.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:12.095.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:17.095.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:17.095.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:22.095.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:22.095.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:27.095.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:27.095.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:32.095.852 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:32.095.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:37.096.111 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:37.096.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:42.096.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:42.096.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:47.096.560 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:47.096.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:52.096.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:52.096.857 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:57.097.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:56:57.097.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:02.097.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:02.097.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:07.097.479 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:07.097.542 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:12.097.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:12.097.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:17.097.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:17.098.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:22.098.207 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:22.098.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:27.098.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:27.098.514 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:32.098.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:32.098.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:37.098.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:37.098.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:42.099.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:42.099.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:47.099.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:47.099.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:52.099.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:52.099.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:57.100.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:57:57.100.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:02.100.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:02.100.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:07.100.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:07.100.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:12.100.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:12.100.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:17.100.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:17.101.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:22.101.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:22.101.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:27.101.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:27.101.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:32.101.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:32.101.751 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:37.101.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:37.102.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:42.102.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:42.102.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:47.102.419 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:47.102.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:52.102.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:52.102.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:57.102.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:58:57.102.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:02.103.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:02.103.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:07.103.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:07.103.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:12.103.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:12.103.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:17.103.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:17.103.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:22.104.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:22.104.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:27.104.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:27.104.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:32.104.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:32.104.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:37.104.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:37.104.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:42.105.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:42.105.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:47.105.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:47.105.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:52.105.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:52.105.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:57.105.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-05:59:57.105.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:02.105.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:02.106.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:07.106.241 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:07.106.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:12.106.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:12.106.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:17.106.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:17.106.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:22.106.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:22.107.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:27.107.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:27.107.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:32.107.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:32.107.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:37.107.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:37.107.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:42.107.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:42.108.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:47.108.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:47.108.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:52.108.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:52.108.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:57.109.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:00:57.109.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:02.109.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:02.109.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:07.109.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:07.109.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:12.109.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:12.109.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:17.110.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:17.110.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:22.110.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:22.110.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:27.110.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:27.110.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:32.110.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:32.110.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:37.111.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:37.111.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:42.111.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:42.111.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:47.111.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:47.111.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:52.111.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:52.111.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:57.111.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:01:57.112.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:02.112.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:02.112.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:07.112.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:07.112.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:12.112.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:12.112.751 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:17.112.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:17.112.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:22.113.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:22.113.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:27.113.381 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:27.113.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:32.113.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:32.113.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:37.113.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:37.113.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:42.114.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:42.114.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:47.114.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:47.114.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:52.114.589 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:52.114.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:57.114.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:02:57.114.889 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:02.115.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:02.115.123 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:07.115.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:07.115.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:12.115.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:12.115.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:17.115.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:17.115.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:22.116.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:22.116.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:27.116.246 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:27.116.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:32.116.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:32.116.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:37.116.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:37.116.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:42.117.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:42.117.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:47.117.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:47.117.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:52.117.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:52.117.540 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:57.117.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:03:57.117.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:02.117.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:02.117.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:07.118.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:07.118.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:12.118.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:12.118.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:17.118.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:17.118.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:22.118.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:22.118.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:27.119.111 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:27.119.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:32.119.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:32.119.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:37.119.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:37.119.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:42.119.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:42.119.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:47.120.058 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:47.120.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:52.120.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:52.120.346 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:57.120.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:04:57.120.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:02.120.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:02.120.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:07.121.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:07.121.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:12.121.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:12.121.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:17.121.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:17.121.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:22.121.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:22.121.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:27.122.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:27.122.663 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:32.122.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:32.122.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:37.123.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:37.123.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:42.123.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:42.123.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:47.123.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:47.123.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:52.123.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:52.123.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:57.124.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:05:57.124.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:02.124.254 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:02.124.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:07.124.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:07.124.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:12.124.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:12.124.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:17.124.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:17.125.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:22.125.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:22.125.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:27.125.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:27.125.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:32.125.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:32.125.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:37.125.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:37.126.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:42.126.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:42.126.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:47.126.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:47.126.502 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:52.126.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:52.126.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:57.126.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:06:57.126.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:02.127.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:02.127.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:07.127.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:07.127.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:12.127.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:12.127.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:17.127.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:17.127.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:22.128.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:22.128.176 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:27.128.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:27.128.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:32.128.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:32.128.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:37.128.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:37.128.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:42.129.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:42.129.110 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:47.129.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:47.129.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:52.129.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:52.129.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:57.129.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:07:57.129.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:02.129.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:02.130.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:07.130.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:07.130.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:12.130.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:12.130.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:17.130.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:17.130.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:22.130.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:22.131.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:27.131.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:27.131.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:32.131.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:32.131.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:37.131.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:37.131.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:42.131.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:42.131.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:47.132.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:47.132.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:52.132.383 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:52.132.448 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:57.132.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:08:57.132.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:02.132.871 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:02.132.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:07.133.111 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:07.133.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:12.133.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:12.133.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:17.133.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:17.133.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:22.133.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:22.133.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:27.134.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:27.134.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:32.134.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:32.134.392 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:37.134.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:37.134.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:42.134.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:42.134.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:47.135.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:47.135.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:52.135.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:52.135.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:57.135.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:09:57.135.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:02.135.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:02.135.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:07.135.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:07.135.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:12.136.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:12.136.210 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:17.136.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:17.136.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:22.136.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:22.136.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:27.136.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:27.136.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:32.137.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:32.137.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:37.137.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:37.137.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:42.137.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:42.137.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:47.137.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:47.137.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:52.138.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:52.138.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:57.138.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:10:57.138.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:02.138.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:02.138.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:07.138.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:07.138.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:12.139.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:12.139.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:17.139.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:17.139.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:22.139.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:22.139.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:27.139.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:27.139.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-06:11:31.696.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 0 has unregistered. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:32.140.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 3 alive nodes. +[WARNING] DISTRIBUTED(978947,ffffb95c2010,python):2024-07-30-06:11:32.940.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-06:11:35.317.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 1 has unregistered. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-06:11:35.470.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 3 has unregistered. +[WARNING] DISTRIBUTED(978947,fffd83fff1e0,python):2024-07-30-06:11:35.495.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 2 has unregistered. +/arrow/cpp/src/arrow/filesystem/s3fs.cc:2598: arrow::fs::FinalizeS3 was not called even though S3 was initialized. This could lead to a segmentation fault at exit diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_0.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_0.log" new file mode 100644 index 00000000..9deeba1b --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_0.log" @@ -0,0 +1,10218 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:07:40.563.986 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:07:41.564.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:07:44.565.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:07:47.565.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:07:47.565.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 0 rank id: 0 +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:08:11.695.710 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:08:11.698.045 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(978967,ffff87186010,python):2024-07-30-02:08:14.445.512 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-30 02:08:14,448 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_0.ckpt' +2024-07-30 02:08:14,482 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-30 02:08:14,482 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-30 02:08:14,482 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-30 02:08:14,482 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-30 02:08:14,483 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/research/output' +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-30 02:08:14,486 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,486 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-30 02:08:14,486 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-30 02:08:14,486 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-30 02:08:14,487 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:3125 +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:3, sink_size:2 +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:3125 +2024-07-30 02:08:14,497 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-30 02:08:14,497 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:08:14.500.440 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:08:14.503.076 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-30 02:08:14,615 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:08:14.616.932 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:08:14.617.075 [mindspore/common/parameter.py:806] This interface may be deleted in the future. +2024-07-30 02:08:14,637 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,658 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,679 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,700 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,721 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,742 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,764 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,785 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,807 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:15,282 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,480 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +[INFO] 2024-07-30 02:08:15,481 [978967] [SDK] : Start to freeze model for delta, mode: lora, include list: None, exclude list: None +[INFO] 2024-07-30 02:08:15,482 [978967] [SDK] : Start to freeze model, include list: ['*'], exclude list: ['*mindpet_delta_lora*'] +[INFO] 2024-07-30 02:08:15,488 [978967] [SDK] : End to freeze model. +[INFO] 2024-07-30 02:08:15,488 [978967] [SDK] : End to freeze model for delta. +2024-07-30 02:08:15,502 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-30 02:08:15,503 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... +2024-07-30 02:08:15,503 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-30 02:08:15,503 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-30 02:08:15,509 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-30 02:08:15,512 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + "model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + "model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + "model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-30 02:08:15,613 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... +2024-07-30 02:08:15,613 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-30 02:08:15,619 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-30 02:08:15,621 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-30 02:08:15,622 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-30 02:08:15,622 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:09:56.503.2 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:00.961.296 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:00.962.110 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:00.962.570 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:01.110.021 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:01.151.680 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:01.195.050 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:01.345.373 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:01.934.983 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:02.509.002 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.960.82 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.968.64 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.973.06 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.242.694 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.286.352 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.325.404 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:03.470.921 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:04.455.89 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:04.609.872 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.184.213 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.185.116 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.185.587 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.336.794 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.377.797 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.418.926 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:05.570.420 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:06.141.535 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:06.710.987 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.279.124 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.280.026 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.280.466 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.443.955 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.484.923 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.526.062 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:07.695.970 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:08.270.354 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:08.949.715 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.516.736 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.517.605 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.518.146 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.679.014 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.720.913 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.765.113 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:09.926.689 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:10.501.225 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.585.47 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.630.323 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.631.298 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.631.818 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.853.157 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:11.964.051 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:12.658.7 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:12.186.238 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:12.764.637 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:13.332.731 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:13.900.676 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:13.901.623 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:13.902.074 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:14.689.20 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:14.112.582 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:14.154.968 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:14.326.702 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:14.887.610 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:15.447.865 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.157.17 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.166.73 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.171.39 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.175.380 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.218.195 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.265.524 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:16.433.779 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:17.523.8 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:17.581.290 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.154.512 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.155.319 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.155.800 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.331.273 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.388.423 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.433.921 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:18.630.046 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:19.207.958 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:19.776.135 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.387.394 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.388.393 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.388.878 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.555.320 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.629.052 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.674.564 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:20.843.816 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:21.437.161 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.373.96 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.603.990 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.604.973 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.605.459 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.786.374 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.833.913 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:22.882.644 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:23.536.84 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:23.612.581 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.179.081 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.743.999 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.745.042 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.745.567 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.911.317 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:24.962.001 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:25.839.8 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:25.182.150 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:25.795.312 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:26.385.026 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:26.973.852 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:26.974.818 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:26.975.281 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:27.139.265 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:27.187.094 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:27.233.546 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:27.402.890 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:27.994.950 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:28.595.786 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.186.225 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.187.166 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.187.695 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.353.848 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.401.773 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.448.892 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:29.614.882 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:30.220.146 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:30.793.058 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.365.482 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.366.408 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.366.907 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.529.077 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.581.980 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.630.543 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:31.804.232 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:32.400.625 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:32.993.792 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.590.077 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.590.990 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.591.479 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.773.659 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.849.445 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:33.896.374 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:34.824.64 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:34.755.958 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:35.337.450 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:35.906.543 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:35.907.754 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:35.908.288 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:36.706.35 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:36.119.525 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:36.170.624 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:36.348.610 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:36.951.445 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:37.534.580 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.111.332 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.112.244 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.112.778 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.284.206 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.334.273 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.379.617 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:38.560.397 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:39.134.794 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:39.695.963 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.274.668 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.275.620 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.276.125 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.447.426 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.494.859 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.566.679 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:40.754.063 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:41.328.132 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:41.899.781 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.498.028 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.498.960 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.499.470 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.671.060 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.719.604 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.764.623 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:42.935.510 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:43.541.287 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:44.178.112 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:44.810.616 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:44.812.579 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:44.813.083 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:45.351.00 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:45.135.011 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:45.190.757 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:45.357.482 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:45.973.119 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:46.586.681 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.172.027 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.173.103 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.173.656 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.352.123 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.403.776 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.450.229 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:47.626.757 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:48.216.671 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:48.818.744 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.405.928 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.406.937 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.407.463 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.585.680 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.633.315 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.681.098 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:49.856.428 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:50.443.347 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.508.65 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.637.983 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.639.035 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.639.626 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.820.399 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.868.605 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:51.914.760 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:52.885.81 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:52.669.639 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:53.245.085 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:53.848.479 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:53.849.446 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:53.849.997 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:54.212.17 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:54.695.24 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:54.116.877 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:54.293.709 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:54.876.007 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:55.448.398 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.420.14 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.429.54 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.435.06 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.210.342 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.268.571 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.317.529 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:56.544.426 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:57.144.593 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:57.722.383 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.366.006 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.366.996 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.367.552 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.568.700 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.613.760 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.658.317 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:58.835.209 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:10:59.446.823 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.800.38 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.680.312 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.681.399 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.681.960 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.854.149 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.904.378 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:00.952.799 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:01.136.472 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:01.722.359 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:02.317.874 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:02.906.263 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:02.907.207 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:02.907.721 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:03.812.86 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:03.133.960 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:03.182.317 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:03.360.885 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:03.950.515 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:04.549.532 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.155.445 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.156.411 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.156.973 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.328.581 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.377.951 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.424.121 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:05.596.637 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:06.171.639 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:06.781.088 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.366.269 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.367.214 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.367.733 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.540.317 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.589.500 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.633.939 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:07.829.611 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:08.413.942 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.907.8 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.592.298 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.593.306 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.593.826 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.768.254 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.817.245 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:09.862.376 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:10.383.49 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:10.632.456 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:11.221.961 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:11.825.828 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:11.826.793 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:45.652.031 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:45.656.832 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:56.407.50 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:11:56.447.72 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:06.184.136 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:06.188.302 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:16.426.583 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:16.430.604 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:26.641.455 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:26.645.528 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:36.763.800 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:36.767.953 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:46.986.238 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:46.990.243 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:57.138.543 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:12:57.142.750 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:07.358.329 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:07.362.316 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:17.518.541 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:17.522.581 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:27.727.621 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:27.731.786 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:37.968.600 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:37.972.748 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:48.118.740 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:48.122.960 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:58.386.093 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:13:58.390.153 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:08.564.812 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:08.568.891 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:18.767.522 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:18.771.731 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:28.963.875 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:28.967.931 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:39.103.786 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:39.108.029 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:49.337.548 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:49.341.644 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:59.559.218 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:14:59.563.287 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:09.807.625 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:09.812.323 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:20.146.18 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:20.187.22 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:30.256.201 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:30.260.392 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:40.526.357 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:40.530.413 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:50.771.728 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:15:50.775.868 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:00.994.190 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:00.998.392 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:11.278.515 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:11.282.513 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:21.547.620 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:21.551.812 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:31.893.311 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:31.897.506 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:42.191.563 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:42.195.841 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:52.475.984 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:16:52.480.073 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:02.767.823 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:02.771.932 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:13.722.1 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:37.881.572 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:37.882.044 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-30 02:17:37,882 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-30 02:17:37,883 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO - .........Starting Training Model.......... +{'auto_trans_ckpt': False, + 'auto_tune': False, + 'autotune_per_step': 10, + 'callbacks': [OrderedDict([('type', 'MFLossMonitor')]), + OrderedDict([('type', 'CheckpointMointor'), + ('prefix', 'llama3_8b'), + ('save_checkpoint_steps', 1400), + ('integrated_save', False), + ('async_save', False)]), + OrderedDict([('type', 'ObsMonitor')])], + 'context': {'device_target': 'Ascend', + 'enable_graph_kernel': False, + 'graph_kernel_flags': '--disable_expand_ops=Softmax,Dropout ' + '--enable_parallel_fusion=true ' + '--reduce_fuse_depth=8 ' + '--enable_auto_tensor_inplace=true', + 'max_call_depth': 10000, + 'runtime_num_threads': 1, + 'save_graphs': False, + 'save_graphs_path': './graph'}, + 'data_size': 3125, + 'device_num': 4, + 'do_eval': False, + 'eval_callbacks': [OrderedDict([('type', 'ObsMonitor')])], + 'eval_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'eval_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'filepath_prefix': './autotune', + 'init_start_profile': False, + 'layer_decay': 0.65, + 'layer_scale': False, + 'load_checkpoint': '/home/ma-user/work/llama3-8B.ckpt', + 'local_rank': 0, + 'lr_scale_factor': 256, + 'lr_schedule': {'learning_rate': 1e-05, + 'lr_end': 0.0, + 'total_steps': 9374, + 'type': 'CosineWithWarmUpLR', + 'warmup_steps': 281}, + 'metric': [{'type': 'PerplexityMetric'}], + 'micro_batch_interleave_num': 1, + 'model': {'arch': {'type': 'LlamaForCausalLM'}, + 'model_config': {'batch_size': 32, + 'bos_token_id': 128000, + 'checkpoint_name_or_path': None, + 'compute_dtype': 'bfloat16', + 'do_sample': False, + 'eos_token_id': 128001, + 'extend_method': 'None', + 'fine_grain_interleave': 1, + 'hidden_size': 4096, + 'ignore_token_id': -100, + 'intermediate_size': 14336, + 'layernorm_compute_type': 'float32', + 'max_decode_length': 512, + 'n_kv_heads': 8, + 'num_heads': 32, + 'num_layers': 32, + 'offset': 0, + 'pad_token_id': 128002, + 'param_init_type': 'bfloat16', + 'pet_config': {'lora_alpha': 16, + 'lora_dropout': 0.0, + 'lora_rank': 8, + 'target_modules': '.*wq|.*wv'}, + 'repetition_penalty': 1, + 'rms_norm_eps': 1e-05, + 'rotary_dtype': 'float32', + 'scaling_factor': 1.0, + 'seq_length': 256, + 'softmax_compute_type': 'float32', + 'theta': 500000, + 'top_k': 3, + 'top_p': 1, + 'type': 'LlamaConfig', + 'use_flash_attention': True, + 'use_past': False, + 'vocab_size': 128256}}, + 'moe_config': , + 'only_save_strategy': False, + 'optimizer': {'beta1': 0.9, + 'beta2': 0.95, + 'eps': 1e-08, + 'type': 'FP32StateAdamWeightDecay'}, + 'output_dir': './output', + 'parallel': {'device_num': 4, + 'enable_alltoall': False, + 'enable_parallel_optimizer': True, + 'full_batch': True, + 'gradients_mean': False, + 'parallel_mode': 'semi_auto_parallel', + 'parallel_optimizer_config': {'gradient_accumulation_shard': False, + 'parallel_optimizer_threshold': 64}, + 'search_mode': 'sharding_propagation', + 'strategy_ckpt_config': {'only_trainable_params': False, + 'save_file': './ckpt_strategy.ckpt'}, + 'strategy_ckpt_save_file': './output/strategy/ckpt_strategy_rank_0.ckpt'}, + 'parallel_config': , + 'profile': False, + 'profile_communication': False, + 'profile_memory': True, + 'profile_start_step': 4, + 'profile_stop_step': 8, + 'rank_id': 0, + 'recompute_config': , + 'remote_save_url': '', + 'resume_training': False, + 'run_mode': 'finetune', + 'runner_config': {'batch_size': 32, + 'epochs': 4687, + 'gradient_accumulation_steps': 1, + 'initial_epoch': 0, + 'initial_step': 0, + 'origin_epochs': 3, + 'sink_mode': True, + 'sink_size': 2}, + 'runner_wrapper': {'scale_sense': 1.0, + 'type': 'MFTrainOneStepCell', + 'use_clip_grad': True}, + 'seed': 0, + 'src_strategy_path_or_dir': '', + 'train_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '/home/ma-user/work/trainset-v2-fastchat256.mindrecord', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'train_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '/home/ma-user/work/trainset-v2-fastchat256.mindrecord', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', + 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', + 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'trainer': {'model_name': 'llama3_8b', + 'type': 'CausalLanguageModelingTrainer'}, + 'use_parallel': True} +2024-07-30 02:17:37,890 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:37.891.420 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_begin', 'step_begin', 'step_end', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(978967:281472948264976,MainProcess):2024-07-30-02:17:37.891.597 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'step_end', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.079.087 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.079.879 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.080.584 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.081.265 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.081.939 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.082.615 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.083.285 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.083.954 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.084.639 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.085.339 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.086.016 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.086.671 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.087.329 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.087.987 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.088.660 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.089.327 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.089.983 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.090.660 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.091.311 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.091.960 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.092.629 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.093.273 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.093.925 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.094.586 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.095.236 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.095.904 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.096.571 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.097.226 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.097.878 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.098.530 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.099.186 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.099.833 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.100.294 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.101.063 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.101.804 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.102.542 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.103.259 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.103.989 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.104.749 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.105.488 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.106.224 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.106.978 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.107.714 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.108.445 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.109.183 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.109.899 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.110.615 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.111.329 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.112.036 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.112.805 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.113.511 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.114.209 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.114.910 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.115.611 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.116.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.117.033 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.117.730 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.118.442 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.119.142 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.119.821 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.120.500 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.121.189 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.121.825 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:06.122.444 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978967,ffff87186010,python):2024-07-30-02:18:08.691.692 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. +- \ | 2024-07-30 02:26:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2/ 3125], loss: 1.392, per_step_time: 259709ms, lr: 3.558719e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:19,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.03080 samples/s/p 28 days, 4:11:01 } +2024-07-30 02:26:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 4/ 3125], loss: 1.327, per_step_time: 1474ms, lr: 1.0676156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.42694 samples/s/p 3:50:14 } +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 6/ 3125], loss: 1.193, per_step_time: 1413ms, lr: 1.7793593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:26,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.66026 samples/s/p 3:40:41 } +2024-07-30 02:26:28,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 8/ 3125], loss: 1.399, per_step_time: 1415ms, lr: 2.4911031e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:28,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65262 samples/s/p 3:40:56 } +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 10/ 3125], loss: 1.360, per_step_time: 1416ms, lr: 3.202847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.64784 samples/s/p 3:41:05 } +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 12/ 3125], loss: 1.379, per_step_time: 1413ms, lr: 3.9145905e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:34,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65944 samples/s/p 3:40:35 } +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 14/ 3125], loss: 1.350, per_step_time: 1413ms, lr: 4.6263344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:37,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65819 samples/s/p 3:40:35 } +2024-07-30 02:26:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 16/ 3125], loss: 1.343, per_step_time: 1413ms, lr: 5.3380785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:40,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.66154 samples/s/p 3:40:24 } +2024-07-30 02:26:43,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 18/ 3125], loss: 1.049, per_step_time: 1414ms, lr: 6.049822e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:43,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65730 samples/s/p 3:40:31 } +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 20/ 3125], loss: 1.286, per_step_time: 1413ms, lr: 6.7615656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.66074 samples/s/p 3:40:20 } +2024-07-30 02:26:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 22/ 3125], loss: 1.170, per_step_time: 1413ms, lr: 7.473309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65794 samples/s/p 3:40:24 } +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 24/ 3125], loss: 1.197, per_step_time: 1413ms, lr: 8.185053e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66088 samples/s/p 3:40:14 } +2024-07-30 02:26:54,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 26/ 3125], loss: 1.367, per_step_time: 1413ms, lr: 8.896797e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:54,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65786 samples/s/p 3:40:19 } +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 28/ 3125], loss: 1.430, per_step_time: 1413ms, lr: 9.608541e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65840 samples/s/p 3:40:15 } +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 30/ 3125], loss: 1.447, per_step_time: 1413ms, lr: 1.0320284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:00,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66161 samples/s/p 3:40:04 } +2024-07-30 02:27:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 32/ 3125], loss: 1.653, per_step_time: 1415ms, lr: 1.1032029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:02,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65352 samples/s/p 3:40:20 } +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 34/ 3125], loss: 1.188, per_step_time: 1424ms, lr: 1.1743772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:05,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.61451 samples/s/p 3:41:49 } +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 36/ 3125], loss: 1.306, per_step_time: 1414ms, lr: 1.2455515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65672 samples/s/p 3:40:07 } +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 38/ 3125], loss: 1.332, per_step_time: 1413ms, lr: 1.3167258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.66042 samples/s/p 3:39:56 } +2024-07-30 02:27:14,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 40/ 3125], loss: 1.375, per_step_time: 1416ms, lr: 1.3879004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.64954 samples/s/p 3:40:18 } +2024-07-30 02:27:17,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 42/ 3125], loss: 1.420, per_step_time: 1413ms, lr: 1.4590747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:17,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65881 samples/s/p 3:39:54 } +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 44/ 3125], loss: 1.437, per_step_time: 1412ms, lr: 1.530249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66248 samples/s/p 3:39:42 } +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 46/ 3125], loss: 1.287, per_step_time: 1413ms, lr: 1.6014234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:22,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66144 samples/s/p 3:39:42 } +2024-07-30 02:27:25,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 48/ 3125], loss: 1.380, per_step_time: 1414ms, lr: 1.6725978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:25,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65546 samples/s/p 3:39:53 } +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 50/ 3125], loss: 1.100, per_step_time: 1413ms, lr: 1.7437721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65905 samples/s/p 3:39:42 } +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 52/ 3125], loss: 1.361, per_step_time: 1413ms, lr: 1.8149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65896 samples/s/p 3:39:39 } +2024-07-30 02:27:34,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 54/ 3125], loss: 1.508, per_step_time: 1413ms, lr: 1.886121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:34,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65853 samples/s/p 3:39:37 } +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 56/ 3125], loss: 1.341, per_step_time: 1413ms, lr: 1.9572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:36,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66059 samples/s/p 3:39:30 } +2024-07-30 02:27:39,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 58/ 3125], loss: 1.275, per_step_time: 1413ms, lr: 2.0284697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:39,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66066 samples/s/p 3:39:27 } +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 60/ 3125], loss: 1.126, per_step_time: 1414ms, lr: 2.099644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65573 samples/s/p 3:39:36 } +2024-07-30 02:27:45,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 62/ 3125], loss: 1.619, per_step_time: 1413ms, lr: 2.1708183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:45,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65985 samples/s/p 3:39:23 } +2024-07-30 02:27:48,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 64/ 3125], loss: 1.251, per_step_time: 1415ms, lr: 2.2419927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:48,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65213 samples/s/p 3:39:38 } +2024-07-30 02:27:51,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 66/ 3125], loss: 1.324, per_step_time: 1413ms, lr: 2.3131672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:51,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65944 samples/s/p 3:39:18 } +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 68/ 3125], loss: 1.160, per_step_time: 1413ms, lr: 2.3843415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:53,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65865 samples/s/p 3:39:17 } +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 70/ 3125], loss: 1.056, per_step_time: 1413ms, lr: 2.4555159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65850 samples/s/p 3:39:15 } +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 72/ 3125], loss: 1.486, per_step_time: 1414ms, lr: 2.5266902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65496 samples/s/p 3:39:20 } +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 74/ 3125], loss: 1.359, per_step_time: 1414ms, lr: 2.5978647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:02,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65634 samples/s/p 3:39:14 } +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 76/ 3125], loss: 1.356, per_step_time: 1415ms, lr: 2.669039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:05,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65248 samples/s/p 3:39:20 } +2024-07-30 02:28:08,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 78/ 3125], loss: 1.349, per_step_time: 1414ms, lr: 2.7402134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:08,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65688 samples/s/p 3:39:07 } +2024-07-30 02:28:10,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 80/ 3125], loss: 1.630, per_step_time: 1412ms, lr: 2.8113877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:10,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66228 samples/s/p 3:38:52 } +2024-07-30 02:28:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 82/ 3125], loss: 1.549, per_step_time: 1414ms, lr: 2.8825623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65709 samples/s/p 3:39:01 } +2024-07-30 02:28:16,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 84/ 3125], loss: 1.097, per_step_time: 1413ms, lr: 2.9537364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:16,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65960 samples/s/p 3:38:53 } +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 86/ 3125], loss: 1.357, per_step_time: 1413ms, lr: 3.024911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66110 samples/s/p 3:38:46 } +2024-07-30 02:28:22,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 88/ 3125], loss: 1.011, per_step_time: 1416ms, lr: 3.0960855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:22,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.64686 samples/s/p 3:39:17 } +2024-07-30 02:28:25,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 90/ 3125], loss: 0.990, per_step_time: 1413ms, lr: 3.1672596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:25,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.66077 samples/s/p 3:38:41 } +2024-07-30 02:28:27,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 92/ 3125], loss: 1.119, per_step_time: 1414ms, lr: 3.2384341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:27,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65623 samples/s/p 3:38:49 } +2024-07-30 02:28:30,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 94/ 3125], loss: 1.152, per_step_time: 1414ms, lr: 3.3096082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:30,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65648 samples/s/p 3:38:46 } +2024-07-30 02:28:33,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 96/ 3125], loss: 1.270, per_step_time: 1413ms, lr: 3.3807828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:33,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65921 samples/s/p 3:38:37 } +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 98/ 3125], loss: 1.162, per_step_time: 1414ms, lr: 3.4519574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65456 samples/s/p 3:38:44 } +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 100/ 3125], loss: 0.916, per_step_time: 1413ms, lr: 3.5231315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66171 samples/s/p 3:38:25 } +2024-07-30 02:28:42,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 102/ 3125], loss: 1.030, per_step_time: 1414ms, lr: 3.594306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:42,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65509 samples/s/p 3:38:38 } +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 104/ 3125], loss: 1.432, per_step_time: 1414ms, lr: 3.6654803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65399 samples/s/p 3:38:37 } +2024-07-30 02:28:47,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 106/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.7366547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66062 samples/s/p 3:38:19 } +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 108/ 3125], loss: 1.291, per_step_time: 1413ms, lr: 3.807829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65889 samples/s/p 3:38:20 } +2024-07-30 02:28:53,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 110/ 3125], loss: 1.239, per_step_time: 1413ms, lr: 3.8790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:53,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66160 samples/s/p 3:38:11 } +2024-07-30 02:28:56,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 112/ 3125], loss: 1.071, per_step_time: 1415ms, lr: 3.950178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:56,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65298 samples/s/p 3:38:28 } +2024-07-30 02:28:59,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 114/ 3125], loss: 1.148, per_step_time: 1413ms, lr: 4.021352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:59,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65913 samples/s/p 3:38:11 } +2024-07-30 02:29:02,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 116/ 3125], loss: 1.301, per_step_time: 1413ms, lr: 4.0925265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:02,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66129 samples/s/p 3:38:03 } +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 118/ 3125], loss: 0.982, per_step_time: 1413ms, lr: 4.163701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:04,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65990 samples/s/p 3:38:04 } +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 120/ 3125], loss: 1.209, per_step_time: 1414ms, lr: 4.234875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65687 samples/s/p 3:38:08 } +2024-07-30 02:29:10,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 122/ 3125], loss: 0.910, per_step_time: 1414ms, lr: 4.3060495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:10,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65613 samples/s/p 3:38:07 } +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 124/ 3125], loss: 1.276, per_step_time: 1414ms, lr: 4.377224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65493 samples/s/p 3:38:07 } +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 126/ 3125], loss: 1.127, per_step_time: 1413ms, lr: 4.4483986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65782 samples/s/p 3:37:57 } +2024-07-30 02:29:19,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 128/ 3125], loss: 0.940, per_step_time: 1413ms, lr: 4.519573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:19,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65857 samples/s/p 3:37:53 } +2024-07-30 02:29:21,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 130/ 3125], loss: 1.026, per_step_time: 1413ms, lr: 4.5907473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:21,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65910 samples/s/p 3:37:49 } +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 132/ 3125], loss: 0.990, per_step_time: 1414ms, lr: 4.6619216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65721 samples/s/p 3:37:50 } +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 134/ 3125], loss: 1.413, per_step_time: 1413ms, lr: 4.733096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:27,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65855 samples/s/p 3:37:44 } +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 136/ 3125], loss: 1.120, per_step_time: 1413ms, lr: 4.8042702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65851 samples/s/p 3:37:42 } +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 138/ 3125], loss: 0.952, per_step_time: 1415ms, lr: 4.8754446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65355 samples/s/p 3:37:50 } +2024-07-30 02:29:36,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 140/ 3125], loss: 1.111, per_step_time: 1413ms, lr: 4.9466194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:36,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65796 samples/s/p 3:37:37 } +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 142/ 3125], loss: 1.099, per_step_time: 1414ms, lr: 5.0177937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:38,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65587 samples/s/p 3:37:39 } +2024-07-30 02:29:41,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 144/ 3125], loss: 1.208, per_step_time: 1414ms, lr: 5.0889676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:41,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65707 samples/s/p 3:37:34 } +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 146/ 3125], loss: 1.044, per_step_time: 1413ms, lr: 5.160142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:44,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66129 samples/s/p 3:37:21 } +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 148/ 3125], loss: 1.002, per_step_time: 1413ms, lr: 5.2313167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66068 samples/s/p 3:37:20 } +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 150/ 3125], loss: 1.366, per_step_time: 1413ms, lr: 5.302491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66082 samples/s/p 3:37:16 } +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 152/ 3125], loss: 0.954, per_step_time: 1413ms, lr: 5.3736658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:53,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66132 samples/s/p 3:37:13 } +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 154/ 3125], loss: 0.976, per_step_time: 1413ms, lr: 5.4448396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66013 samples/s/p 3:37:12 } +2024-07-30 02:29:58,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 156/ 3125], loss: 1.448, per_step_time: 1415ms, lr: 5.516014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:58,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65360 samples/s/p 3:37:25 } +2024-07-30 02:30:01,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 158/ 3125], loss: 1.134, per_step_time: 1413ms, lr: 5.5871883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:01,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65955 samples/s/p 3:37:08 } +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 160/ 3125], loss: 1.046, per_step_time: 1413ms, lr: 5.658363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65897 samples/s/p 3:37:07 } +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 162/ 3125], loss: 1.002, per_step_time: 1414ms, lr: 5.7295374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65490 samples/s/p 3:37:13 } +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 164/ 3125], loss: 0.902, per_step_time: 1412ms, lr: 5.8007113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.66209 samples/s/p 3:36:54 } +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 166/ 3125], loss: 1.278, per_step_time: 1413ms, lr: 5.871886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65937 samples/s/p 3:36:57 } +2024-07-30 02:30:15,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 168/ 3125], loss: 0.935, per_step_time: 1415ms, lr: 5.9430604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:15,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65270 samples/s/p 3:37:10 } +2024-07-30 02:30:18,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 170/ 3125], loss: 0.847, per_step_time: 1413ms, lr: 6.0142347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:18,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65864 samples/s/p 3:36:53 } +2024-07-30 02:30:21,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 172/ 3125], loss: 0.977, per_step_time: 1413ms, lr: 6.0854086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:21,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.66026 samples/s/p 3:36:47 } +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 174/ 3125], loss: 1.147, per_step_time: 1413ms, lr: 6.1565834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66072 samples/s/p 3:36:43 } +2024-07-30 02:30:27,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 176/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 6.2277577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:27,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66089 samples/s/p 3:36:40 } +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 178/ 3125], loss: 0.672, per_step_time: 1413ms, lr: 6.2989325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.65869 samples/s/p 3:36:42 } +2024-07-30 02:30:32,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 180/ 3125], loss: 0.873, per_step_time: 1413ms, lr: 6.370107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:32,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66060 samples/s/p 3:36:35 } +2024-07-30 02:30:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 182/ 3125], loss: 1.075, per_step_time: 1416ms, lr: 6.4412807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:35,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.64730 samples/s/p 3:37:02 } +2024-07-30 02:30:38,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 184/ 3125], loss: 0.945, per_step_time: 1413ms, lr: 6.512455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:38,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65788 samples/s/p 3:36:35 } +2024-07-30 02:30:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 186/ 3125], loss: 0.759, per_step_time: 1415ms, lr: 6.58363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:41,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65079 samples/s/p 3:36:49 } +2024-07-30 02:30:44,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 188/ 3125], loss: 0.980, per_step_time: 1413ms, lr: 6.654804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:44,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.66079 samples/s/p 3:36:23 } +2024-07-30 02:30:46,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 190/ 3125], loss: 1.129, per_step_time: 1413ms, lr: 6.725979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:46,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.66104 samples/s/p 3:36:19 } +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 192/ 3125], loss: 0.925, per_step_time: 1413ms, lr: 6.7971528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65904 samples/s/p 3:36:21 } +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 194/ 3125], loss: 0.785, per_step_time: 1413ms, lr: 6.868327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66036 samples/s/p 3:36:15 } +2024-07-30 02:30:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 196/ 3125], loss: 1.030, per_step_time: 1413ms, lr: 6.9395014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:55,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66146 samples/s/p 3:36:10 } +2024-07-30 02:30:58,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 198/ 3125], loss: 0.733, per_step_time: 1413ms, lr: 7.010676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:58,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65932 samples/s/p 3:36:12 } +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 200/ 3125], loss: 0.688, per_step_time: 1414ms, lr: 7.0818505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65436 samples/s/p 3:36:21 } +2024-07-30 02:31:03,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 202/ 3125], loss: 0.663, per_step_time: 1413ms, lr: 7.1530244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:03,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65829 samples/s/p 3:36:09 } +2024-07-30 02:31:06,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 204/ 3125], loss: 0.988, per_step_time: 1414ms, lr: 7.224199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:06,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65463 samples/s/p 3:36:14 } +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 206/ 3125], loss: 1.034, per_step_time: 1413ms, lr: 7.2953735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65841 samples/s/p 3:36:03 } +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 208/ 3125], loss: 0.978, per_step_time: 1414ms, lr: 7.366548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65556 samples/s/p 3:36:07 } +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 210/ 3125], loss: 0.827, per_step_time: 1413ms, lr: 7.4377217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:15,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.66071 samples/s/p 3:35:52 } +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 212/ 3125], loss: 0.735, per_step_time: 1413ms, lr: 7.5088965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65874 samples/s/p 3:35:54 } +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 214/ 3125], loss: 0.890, per_step_time: 1414ms, lr: 7.580071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65523 samples/s/p 3:35:59 } +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 216/ 3125], loss: 0.707, per_step_time: 1413ms, lr: 7.651245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:23,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.66112 samples/s/p 3:35:43 } +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 218/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 7.7224195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65798 samples/s/p 3:35:47 } +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 220/ 3125], loss: 0.692, per_step_time: 1413ms, lr: 7.793594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:29,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65944 samples/s/p 3:35:41 } +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 222/ 3125], loss: 0.531, per_step_time: 1413ms, lr: 7.864768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:32,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65955 samples/s/p 3:35:38 } +2024-07-30 02:31:35,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 224/ 3125], loss: 0.898, per_step_time: 1415ms, lr: 7.935942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:35,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65123 samples/s/p 3:35:54 } +2024-07-30 02:31:37,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 226/ 3125], loss: 0.747, per_step_time: 1412ms, lr: 8.007118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66247 samples/s/p 3:35:25 } +2024-07-30 02:31:40,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 228/ 3125], loss: 0.643, per_step_time: 1413ms, lr: 8.078292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:40,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66018 samples/s/p 3:35:28 } +2024-07-30 02:31:43,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 230/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 8.149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:43,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65877 samples/s/p 3:35:28 } +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 232/ 3125], loss: 0.616, per_step_time: 1413ms, lr: 8.220641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66042 samples/s/p 3:35:22 } +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 234/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 8.291815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66034 samples/s/p 3:35:19 } +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 236/ 3125], loss: 0.715, per_step_time: 1412ms, lr: 8.362989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66177 samples/s/p 3:35:13 } +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 238/ 3125], loss: 0.645, per_step_time: 1413ms, lr: 8.434164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65948 samples/s/p 3:35:15 } +2024-07-30 02:31:57,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 240/ 3125], loss: 0.602, per_step_time: 1413ms, lr: 8.505338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:57,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66050 samples/s/p 3:35:10 } +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 242/ 3125], loss: 0.831, per_step_time: 1413ms, lr: 8.576512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66009 samples/s/p 3:35:08 } +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 244/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.647687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65903 samples/s/p 3:35:08 } +2024-07-30 02:32:06,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 246/ 3125], loss: 0.654, per_step_time: 1413ms, lr: 8.718861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:06,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65808 samples/s/p 3:35:07 } +2024-07-30 02:32:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 248/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 8.790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:09,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65998 samples/s/p 3:35:00 } +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 250/ 3125], loss: 0.783, per_step_time: 1414ms, lr: 8.86121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65421 samples/s/p 3:35:10 } +2024-07-30 02:32:14,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 252/ 3125], loss: 0.595, per_step_time: 1414ms, lr: 8.932384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:14,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65685 samples/s/p 3:35:01 } +2024-07-30 02:32:17,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 254/ 3125], loss: 0.493, per_step_time: 1414ms, lr: 9.003558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65676 samples/s/p 3:34:59 } +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 256/ 3125], loss: 0.632, per_step_time: 1412ms, lr: 9.074733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.66268 samples/s/p 3:34:42 } +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 258/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 9.145907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:23,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65845 samples/s/p 3:34:49 } +2024-07-30 02:32:26,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 260/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.217081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:26,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65927 samples/s/p 3:34:45 } +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 262/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 9.288256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65996 samples/s/p 3:34:40 } +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 264/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.359431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65905 samples/s/p 3:34:39 } +2024-07-30 02:32:34,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 266/ 3125], loss: 0.649, per_step_time: 1413ms, lr: 9.430605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:34,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65851 samples/s/p 3:34:38 } +2024-07-30 02:32:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 268/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.501779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:37,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65616 samples/s/p 3:34:40 } +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 270/ 3125], loss: 0.578, per_step_time: 1413ms, lr: 9.572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65849 samples/s/p 3:34:32 } +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 272/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.644128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66161 samples/s/p 3:34:22 } +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 274/ 3125], loss: 0.552, per_step_time: 1413ms, lr: 9.715302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66170 samples/s/p 3:34:19 } +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 276/ 3125], loss: 0.565, per_step_time: 1413ms, lr: 9.786476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:48,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66118 samples/s/p 3:34:18 } +2024-07-30 02:32:51,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 278/ 3125], loss: 0.510, per_step_time: 1412ms, lr: 9.857651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:51,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66266 samples/s/p 3:34:11 } +2024-07-30 02:32:54,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 280/ 3125], loss: 0.584, per_step_time: 1413ms, lr: 9.928825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:54,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66136 samples/s/p 3:34:12 } +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 282/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1e-05, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:57,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66004 samples/s/p 3:34:12 } +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 284/ 3125], loss: 0.723, per_step_time: 1413ms, lr: 9.999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66161 samples/s/p 3:34:05 } +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 286/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 9.999995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:02,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65911 samples/s/p 3:34:08 } +2024-07-30 02:33:05,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 288/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.999989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65990 samples/s/p 3:34:04 } +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 290/ 3125], loss: 0.653, per_step_time: 1413ms, lr: 9.999981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66067 samples/s/p 3:33:59 } +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 292/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.99997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66156 samples/s/p 3:33:54 } +2024-07-30 02:33:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 294/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.999957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:14,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66079 samples/s/p 3:33:53 } +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 296/ 3125], loss: 0.624, per_step_time: 1413ms, lr: 9.9999415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65846 samples/s/p 3:33:55 } +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 298/ 3125], loss: 0.522, per_step_time: 1413ms, lr: 9.999923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.66035 samples/s/p 3:33:48 } +2024-07-30 02:33:22,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 300/ 3125], loss: 0.537, per_step_time: 1414ms, lr: 9.999903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:22,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65479 samples/s/p 3:33:58 } +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 302/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.999881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65788 samples/s/p 3:33:48 } +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 304/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 9.999855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65536 samples/s/p 3:33:51 } +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 306/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.999828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66205 samples/s/p 3:33:33 } +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 308/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.999798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65939 samples/s/p 3:33:36 } +2024-07-30 02:33:36,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 310/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.999765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:36,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65985 samples/s/p 3:33:33 } +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 312/ 3125], loss: 0.609, per_step_time: 1413ms, lr: 9.9997305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66046 samples/s/p 3:33:28 } +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 314/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 9.999694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:42,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65778 samples/s/p 3:33:32 } +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 316/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 9.999654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65864 samples/s/p 3:33:27 } +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 318/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.999613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66053 samples/s/p 3:33:20 } +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 320/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.999569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66029 samples/s/p 3:33:17 } +2024-07-30 02:33:53,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 322/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.999521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:53,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66009 samples/s/p 3:33:15 } +2024-07-30 02:33:56,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 324/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.999473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:56,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65954 samples/s/p 3:33:13 } +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 326/ 3125], loss: 0.508, per_step_time: 1415ms, lr: 9.999422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65297 samples/s/p 3:33:26 } +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 328/ 3125], loss: 0.454, per_step_time: 1414ms, lr: 9.999369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65769 samples/s/p 3:33:12 } +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 330/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 9.999312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:05,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.66020 samples/s/p 3:33:03 } +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 332/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.999253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65592 samples/s/p 3:33:10 } +2024-07-30 02:34:10,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 334/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.999193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:10,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65990 samples/s/p 3:32:59 } +2024-07-30 02:34:13,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 336/ 3125], loss: 0.487, per_step_time: 1412ms, lr: 9.99913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66274 samples/s/p 3:32:49 } +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 338/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.999064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:16,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65944 samples/s/p 3:32:54 } +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 340/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.998996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66074 samples/s/p 3:32:48 } +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 342/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 9.998925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65903 samples/s/p 3:32:49 } +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 344/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.998853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65952 samples/s/p 3:32:45 } +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 346/ 3125], loss: 0.434, per_step_time: 1412ms, lr: 9.998778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:27,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66257 samples/s/p 3:32:36 } +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 348/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 9.9987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66025 samples/s/p 3:32:38 } +2024-07-30 02:34:33,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 350/ 3125], loss: 0.393, per_step_time: 1416ms, lr: 9.99862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:33,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.64720 samples/s/p 3:33:05 } +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 352/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 9.998537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65780 samples/s/p 3:32:38 } +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 354/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.998453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:39,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66083 samples/s/p 3:32:28 } +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 356/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 9.998366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65880 samples/s/p 3:32:30 } +2024-07-30 02:34:45,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 358/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.998276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:45,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66000 samples/s/p 3:32:24 } +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 360/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 9.998184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65706 samples/s/p 3:32:28 } +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 362/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.99809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65900 samples/s/p 3:32:21 } +2024-07-30 02:34:53,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 364/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.997993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:53,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66042 samples/s/p 3:32:15 } +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 366/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:56,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65993 samples/s/p 3:32:13 } +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 368/ 3125], loss: 0.439, per_step_time: 1412ms, lr: 9.997793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66218 samples/s/p 3:32:05 } +2024-07-30 02:35:02,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 370/ 3125], loss: 0.284, per_step_time: 1425ms, lr: 9.99769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.61136 samples/s/p 3:33:58 } +2024-07-30 02:35:04,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 372/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.997583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:04,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65994 samples/s/p 3:32:05 } +2024-07-30 02:35:07,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 374/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.997474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:07,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65477 samples/s/p 3:32:14 } +2024-07-30 02:35:10,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 376/ 3125], loss: 0.395, per_step_time: 1412ms, lr: 9.997363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:10,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.66181 samples/s/p 3:31:55 } +2024-07-30 02:35:13,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 378/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 9.997249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.65755 samples/s/p 3:32:02 } +2024-07-30 02:35:16,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 380/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.997134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:16,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65847 samples/s/p 3:31:57 } +2024-07-30 02:35:19,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 382/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.997016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:19,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65774 samples/s/p 3:31:56 } +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 384/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.996896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:21,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65775 samples/s/p 3:31:53 } +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 386/ 3125], loss: 0.075, per_step_time: 1414ms, lr: 9.996773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65713 samples/s/p 3:31:51 } +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 388/ 3125], loss: 0.596, per_step_time: 1413ms, lr: 9.996647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65819 samples/s/p 3:31:46 } +2024-07-30 02:35:30,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 390/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.996519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:30,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66132 samples/s/p 3:31:36 } +2024-07-30 02:35:33,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 392/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.996389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:33,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66115 samples/s/p 3:31:34 } +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 394/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.996256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:36,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66025 samples/s/p 3:31:33 } +2024-07-30 02:35:38,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 396/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.996122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66020 samples/s/p 3:31:30 } +2024-07-30 02:35:41,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 398/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.995984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:41,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65801 samples/s/p 3:31:32 } +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 400/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.995845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65652 samples/s/p 3:31:33 } +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 402/ 3125], loss: 0.443, per_step_time: 1413ms, lr: 9.995703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:47,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65942 samples/s/p 3:31:23 } +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 404/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.995558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.66105 samples/s/p 3:31:17 } +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 406/ 3125], loss: 0.283, per_step_time: 1414ms, lr: 9.995412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65739 samples/s/p 3:31:22 } +2024-07-30 02:35:55,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 408/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.995262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:55,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65740 samples/s/p 3:31:20 } +2024-07-30 02:35:58,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 410/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 9.995111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:58,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65926 samples/s/p 3:31:13 } +2024-07-30 02:36:01,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 412/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.994957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:01,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65947 samples/s/p 3:31:09 } +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 414/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.994801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:04,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66024 samples/s/p 3:31:05 } +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 416/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.994643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65767 samples/s/p 3:31:08 } +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 418/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.994482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66009 samples/s/p 3:30:59 } +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 420/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 9.994317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66257 samples/s/p 3:30:51 } +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 422/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.994152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.65785 samples/s/p 3:30:59 } +2024-07-30 02:36:18,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 424/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.993983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:18,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66043 samples/s/p 3:30:50 } +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 426/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 9.9938125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:21,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66153 samples/s/p 3:30:45 } +2024-07-30 02:36:24,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 428/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.99364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:24,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66163 samples/s/p 3:30:42 } +2024-07-30 02:36:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 430/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.993465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:27,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65914 samples/s/p 3:30:45 } +2024-07-30 02:36:29,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 432/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.993287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:29,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65786 samples/s/p 3:30:45 } +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 434/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 9.993107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65967 samples/s/p 3:30:38 } +2024-07-30 02:36:35,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 436/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 9.992924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:35,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65678 samples/s/p 3:30:41 } +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 438/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 9.992738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65743 samples/s/p 3:30:37 } +2024-07-30 02:36:41,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 440/ 3125], loss: 0.661, per_step_time: 1413ms, lr: 9.992552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:41,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.66099 samples/s/p 3:30:26 } +2024-07-30 02:36:44,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 442/ 3125], loss: 0.255, per_step_time: 1416ms, lr: 9.992362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:44,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.64739 samples/s/p 3:30:54 } +2024-07-30 02:36:46,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 444/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.99217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:46,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65935 samples/s/p 3:30:24 } +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 446/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.991976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:49,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66011 samples/s/p 3:30:20 } +2024-07-30 02:36:52,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 448/ 3125], loss: 0.331, per_step_time: 1415ms, lr: 9.991779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:52,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65352 samples/s/p 3:30:32 } +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 450/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.99158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66310 samples/s/p 3:30:07 } +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 452/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.991378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:58,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66019 samples/s/p 3:30:11 } +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 454/ 3125], loss: 0.512, per_step_time: 1414ms, lr: 9.991173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:01,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65760 samples/s/p 3:30:14 } +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 456/ 3125], loss: 0.390, per_step_time: 1414ms, lr: 9.990968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65580 samples/s/p 3:30:15 } +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 458/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.990758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:06,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65724 samples/s/p 3:30:09 } +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 460/ 3125], loss: 0.634, per_step_time: 1412ms, lr: 9.990547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66273 samples/s/p 3:29:54 } +2024-07-30 02:37:12,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 462/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.990334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66178 samples/s/p 3:29:53 } +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 464/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 9.990118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65504 samples/s/p 3:30:06 } +2024-07-30 02:37:18,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 466/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 9.9899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:18,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66025 samples/s/p 3:29:51 } +2024-07-30 02:37:20,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 468/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 9.98968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:20,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66192 samples/s/p 3:29:45 } +2024-07-30 02:37:23,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 470/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.989456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:23,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66128 samples/s/p 3:29:43 } +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 472/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.98923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.65893 samples/s/p 3:29:46 } +2024-07-30 02:37:29,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 474/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.989003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:29,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65995 samples/s/p 3:29:41 } +2024-07-30 02:37:32,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 476/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 9.988773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:32,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.66038 samples/s/p 3:29:37 } +2024-07-30 02:37:35,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 478/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.98854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:35,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.66154 samples/s/p 3:29:31 } +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 480/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.9883055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:37,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65895 samples/s/p 3:29:34 } +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 482/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 9.988068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65680 samples/s/p 3:29:36 } +2024-07-30 02:37:43,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 484/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 9.987828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:43,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65968 samples/s/p 3:29:27 } +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 486/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.987586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:46,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65829 samples/s/p 3:29:27 } +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 488/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.987341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:49,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65938 samples/s/p 3:29:22 } +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 490/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 9.987094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.66150 samples/s/p 3:29:14 } +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 492/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 9.986845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65863 samples/s/p 3:29:18 } +2024-07-30 02:37:57,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 494/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.986594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:57,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65773 samples/s/p 3:29:17 } +2024-07-30 02:38:00,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 496/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 9.986339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:00,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65765 samples/s/p 3:29:15 } +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 498/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 9.986084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65704 samples/s/p 3:29:13 } +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 500/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 9.985824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65729 samples/s/p 3:29:10 } +2024-07-30 02:38:09,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 502/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 9.985563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:09,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66048 samples/s/p 3:29:00 } +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 504/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 9.9853005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66317 samples/s/p 3:28:51 } +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 506/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 9.985034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:14,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65656 samples/s/p 3:29:03 } +2024-07-30 02:38:17,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 508/ 3125], loss: 0.528, per_step_time: 1413ms, lr: 9.984766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:17,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66136 samples/s/p 3:28:49 } +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 510/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.984494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:20,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65822 samples/s/p 3:28:53 } +2024-07-30 02:38:23,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 512/ 3125], loss: 0.172, per_step_time: 1415ms, lr: 9.984221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:23,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65340 samples/s/p 3:29:01 } +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 514/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.983946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66004 samples/s/p 3:28:44 } +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 516/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 9.983668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66183 samples/s/p 3:28:37 } +2024-07-30 02:38:31,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 518/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.983388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:31,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66023 samples/s/p 3:28:38 } +2024-07-30 02:38:34,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 520/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.983105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:34,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65954 samples/s/p 3:28:36 } +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 522/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 9.98282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.65930 samples/s/p 3:28:34 } +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 524/ 3125], loss: 0.506, per_step_time: 1413ms, lr: 9.982533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66089 samples/s/p 3:28:28 } +2024-07-30 02:38:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 526/ 3125], loss: 0.324, per_step_time: 1412ms, lr: 9.982244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66249 samples/s/p 3:28:21 } +2024-07-30 02:38:45,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 528/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.981952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:45,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66151 samples/s/p 3:28:21 } +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 530/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.981657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:48,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66164 samples/s/p 3:28:18 } +2024-07-30 02:38:51,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 532/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.981361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:51,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66132 samples/s/p 3:28:16 } +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 534/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.981061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:54,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66037 samples/s/p 3:28:15 } +2024-07-30 02:38:57,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 536/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.980759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:57,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66167 samples/s/p 3:28:09 } +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 538/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66127 samples/s/p 3:28:07 } +2024-07-30 02:39:02,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 540/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:02,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66047 samples/s/p 3:28:06 } +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 542/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.97984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66026 samples/s/p 3:28:04 } +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 544/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 9.979529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65786 samples/s/p 3:28:06 } +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 546/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.979216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65477 samples/s/p 3:28:10 } +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 548/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 9.9788995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65697 samples/s/p 3:28:03 } +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 550/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.978581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65914 samples/s/p 3:27:55 } +2024-07-30 02:39:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 552/ 3125], loss: 0.391, per_step_time: 1415ms, lr: 9.978261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65261 samples/s/p 3:28:06 } +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 554/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.977938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65715 samples/s/p 3:27:54 } +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 556/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.9776125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.66054 samples/s/p 3:27:43 } +2024-07-30 02:39:28,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 558/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.977284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:28,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66045 samples/s/p 3:27:41 } +2024-07-30 02:39:31,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 560/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 9.976954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:31,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66210 samples/s/p 3:27:34 } +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 562/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66019 samples/s/p 3:27:36 } +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 564/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.976287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:36,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.66146 samples/s/p 3:27:30 } +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 566/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.97595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.65993 samples/s/p 3:27:31 } +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 568/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 9.97561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.66219 samples/s/p 3:27:23 } +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 570/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 9.975269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65511 samples/s/p 3:27:35 } +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 572/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 9.974923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65969 samples/s/p 3:27:23 } +2024-07-30 02:39:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 574/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.974578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:51,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65891 samples/s/p 3:27:21 } +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 576/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.974228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:53,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65587 samples/s/p 3:27:25 } +2024-07-30 02:39:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 578/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 9.973876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:56,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65703 samples/s/p 3:27:20 } +2024-07-30 02:39:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 580/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.9735225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:59,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.66130 samples/s/p 3:27:08 } +2024-07-30 02:40:02,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 582/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 9.973166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:02,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65689 samples/s/p 3:27:15 } +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 584/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.972808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:05,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.66123 samples/s/p 3:27:02 } +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 586/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 9.972447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66242 samples/s/p 3:26:57 } +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 588/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.972084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65827 samples/s/p 3:27:03 } +2024-07-30 02:40:13,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 590/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 9.971717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:13,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66171 samples/s/p 3:26:53 } +2024-07-30 02:40:16,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 592/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.971349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65959 samples/s/p 3:26:55 } +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 594/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.970979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:19,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65809 samples/s/p 3:26:55 } +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 596/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.970605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65777 samples/s/p 3:26:53 } +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 598/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.970231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:25,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65917 samples/s/p 3:26:47 } +2024-07-30 02:40:27,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 600/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 9.969853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65345 samples/s/p 3:26:57 } +2024-07-30 02:40:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 602/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.969473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65925 samples/s/p 3:26:41 } +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 604/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 9.96909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65968 samples/s/p 3:26:37 } +2024-07-30 02:40:36,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 606/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.968706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:36,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65928 samples/s/p 3:26:35 } +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 608/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.968318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65828 samples/s/p 3:26:35 } +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 610/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 9.967929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66185 samples/s/p 3:26:24 } +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 612/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.967536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66110 samples/s/p 3:26:23 } +2024-07-30 02:40:47,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 614/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 9.967143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65839 samples/s/p 3:26:26 } +2024-07-30 02:40:50,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 616/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.966746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66041 samples/s/p 3:26:19 } +2024-07-30 02:40:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 618/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.966347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65099 samples/s/p 3:26:37 } +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 620/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.9659455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66140 samples/s/p 3:26:11 } +2024-07-30 02:40:59,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 622/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 9.965543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:59,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65683 samples/s/p 3:26:18 } +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 624/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 9.965136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66065 samples/s/p 3:26:07 } +2024-07-30 02:41:04,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 626/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 9.964728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66220 samples/s/p 3:26:01 } +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 628/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.964317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65929 samples/s/p 3:26:04 } +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 630/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.963903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:10,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66056 samples/s/p 3:25:59 } +2024-07-30 02:41:13,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 632/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.963488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:13,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66073 samples/s/p 3:25:56 } +2024-07-30 02:41:16,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 634/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 9.96307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:16,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65154 samples/s/p 3:26:13 } +2024-07-30 02:41:19,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 636/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 9.96265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:19,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65576 samples/s/p 3:26:01 } +2024-07-30 02:41:21,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 638/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.9622275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:21,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66103 samples/s/p 3:25:46 } +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 640/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.961802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66298 samples/s/p 3:25:39 } +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 642/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.961374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65892 samples/s/p 3:25:45 } +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 644/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.960944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65861 samples/s/p 3:25:43 } +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 646/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 9.960513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65617 samples/s/p 3:25:46 } +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 648/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 9.9600775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65977 samples/s/p 3:25:35 } +2024-07-30 02:41:38,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 650/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.959642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:38,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65918 samples/s/p 3:25:33 } +2024-07-30 02:41:41,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 652/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.9592025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:41,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65752 samples/s/p 3:25:34 } +2024-07-30 02:41:44,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 654/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 9.9587605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:44,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65570 samples/s/p 3:25:35 } +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 656/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 9.958317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65749 samples/s/p 3:25:29 } +2024-07-30 02:41:50,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 658/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.95787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:50,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65984 samples/s/p 3:25:21 } +2024-07-30 02:41:53,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 660/ 3125], loss: 0.096, per_step_time: 1412ms, lr: 9.957421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:53,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.66230 samples/s/p 3:25:13 } +2024-07-30 02:41:55,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 662/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.95697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65888 samples/s/p 3:25:17 } +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 664/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.956517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65951 samples/s/p 3:25:13 } +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 666/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.95606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66157 samples/s/p 3:25:06 } +2024-07-30 02:42:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 668/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.955603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:04,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65843 samples/s/p 3:25:10 } +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 670/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 9.955142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:07,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66010 samples/s/p 3:25:03 } +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 672/ 3125], loss: 0.347, per_step_time: 1412ms, lr: 9.95468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66210 samples/s/p 3:24:56 } +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 674/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 9.954214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:12,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66124 samples/s/p 3:24:55 } +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 676/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 9.953746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65404 samples/s/p 3:25:08 } +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 678/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.953275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65937 samples/s/p 3:24:53 } +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 680/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.952803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65985 samples/s/p 3:24:50 } +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 682/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.9523295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65777 samples/s/p 3:24:51 } +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 684/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.951851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65739 samples/s/p 3:24:49 } +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 686/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.951372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65977 samples/s/p 3:24:41 } +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 688/ 3125], loss: 0.346, per_step_time: 1412ms, lr: 9.950891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:32,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.66183 samples/s/p 3:24:34 } +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 690/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 9.950406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65804 samples/s/p 3:24:39 } +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 692/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 9.94992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65902 samples/s/p 3:24:34 } +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 694/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.949431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:41,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66130 samples/s/p 3:24:27 } +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 696/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.948939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:44,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66149 samples/s/p 3:24:23 } +2024-07-30 02:42:46,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 698/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.948445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:46,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66121 samples/s/p 3:24:21 } +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 700/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.947949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.66070 samples/s/p 3:24:19 } +2024-07-30 02:42:52,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 702/ 3125], loss: 0.373, per_step_time: 1416ms, lr: 9.947451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:52,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.64847 samples/s/p 3:24:43 } +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 704/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.946951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65557 samples/s/p 3:24:25 } +2024-07-30 02:42:58,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 706/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.946447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:58,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.66139 samples/s/p 3:24:09 } +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 708/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.945942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.65992 samples/s/p 3:24:10 } +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 710/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 9.945434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:03,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66214 samples/s/p 3:24:02 } +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 712/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.9449235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66094 samples/s/p 3:24:02 } +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 714/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 9.944411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:09,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66256 samples/s/p 3:23:56 } +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 716/ 3125], loss: 0.372, per_step_time: 1412ms, lr: 9.943897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66243 samples/s/p 3:23:53 } +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 718/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 9.943379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66186 samples/s/p 3:23:52 } +2024-07-30 02:43:18,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 720/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 9.942859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66242 samples/s/p 3:23:47 } +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 722/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 9.942337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:20,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65639 samples/s/p 3:23:58 } +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 724/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.941812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65467 samples/s/p 3:23:59 } +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 726/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.941286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65523 samples/s/p 3:23:55 } +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 728/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.940757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:29,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65962 samples/s/p 3:23:42 } +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 730/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.940226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65790 samples/s/p 3:23:43 } +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 732/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.939692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65797 samples/s/p 3:23:40 } +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 734/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.9391555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.66140 samples/s/p 3:23:30 } +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 736/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 9.938616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66111 samples/s/p 3:23:28 } +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 738/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.938076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:43,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65955 samples/s/p 3:23:28 } +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 740/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 9.937533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:46,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66239 samples/s/p 3:23:19 } +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 742/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 9.936987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65738 samples/s/p 3:23:27 } +2024-07-30 02:43:52,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 744/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 9.93644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:52,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65239 samples/s/p 3:23:35 } +2024-07-30 02:43:54,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 746/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 9.935889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:54,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65172 samples/s/p 3:23:34 } +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 748/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.9353365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65942 samples/s/p 3:23:14 } +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.934782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:00,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65571 samples/s/p 3:23:20 } +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 752/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 9.934223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65628 samples/s/p 3:23:15 } +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 754/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 9.933664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65740 samples/s/p 3:23:10 } +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 756/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.933102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66161 samples/s/p 3:22:58 } +2024-07-30 02:44:11,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 758/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 9.932538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:11,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66045 samples/s/p 3:22:58 } +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 760/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.931971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66127 samples/s/p 3:22:53 } +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 762/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 9.931402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.65988 samples/s/p 3:22:54 } +2024-07-30 02:44:20,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 764/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.93083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66042 samples/s/p 3:22:50 } +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.930256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.66035 samples/s/p 3:22:47 } +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 768/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.92968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.66048 samples/s/p 3:22:44 } +2024-07-30 02:44:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 770/ 3125], loss: 0.407, per_step_time: 1420ms, lr: 9.929101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:28,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.63318 samples/s/p 3:23:40 } +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 772/ 3125], loss: 0.230, per_step_time: 1421ms, lr: 9.928521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.62909 samples/s/p 3:23:46 } +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 774/ 3125], loss: 0.346, per_step_time: 1417ms, lr: 9.927937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64516 samples/s/p 3:23:08 } +2024-07-30 02:44:37,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 776/ 3125], loss: 0.453, per_step_time: 1416ms, lr: 9.927351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:37,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64846 samples/s/p 3:22:58 } +2024-07-30 02:44:40,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 778/ 3125], loss: 0.332, per_step_time: 1415ms, lr: 9.926764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:40,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64995 samples/s/p 3:22:52 } +2024-07-30 02:44:43,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 780/ 3125], loss: 0.240, per_step_time: 1415ms, lr: 9.926173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:43,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64994 samples/s/p 3:22:50 } +2024-07-30 02:44:45,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 782/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 9.92558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:45,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.65917 samples/s/p 3:22:27 } +2024-07-30 02:44:48,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 784/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.9249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:48,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65978 samples/s/p 3:22:23 } +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 786/ 3125], loss: 0.095, per_step_time: 1414ms, lr: 9.924388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65562 samples/s/p 3:22:29 } +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 788/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.923788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.66033 samples/s/p 3:22:16 } +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 790/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.923186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:57,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65845 samples/s/p 3:22:17 } +2024-07-30 02:45:00,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 792/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.922582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:00,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.66001 samples/s/p 3:22:11 } +2024-07-30 02:45:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 794/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.921975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65920 samples/s/p 3:22:10 } +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 796/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.921366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:05,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.66051 samples/s/p 3:22:04 } +2024-07-30 02:45:08,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 798/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.920755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:08,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65933 samples/s/p 3:22:04 } +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 800/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 9.920141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65990 samples/s/p 3:22:00 } +2024-07-30 02:45:14,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 802/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.919525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:14,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65871 samples/s/p 3:22:00 } +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 804/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 9.918906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65733 samples/s/p 3:22:00 } +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 806/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.918285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:19,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65868 samples/s/p 3:21:54 } +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 808/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.917661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:22,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65397 samples/s/p 3:22:01 } +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 810/ 3125], loss: 0.288, per_step_time: 1421ms, lr: 9.917036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.62644 samples/s/p 3:22:58 } +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 812/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.916408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.65938 samples/s/p 3:21:44 } +2024-07-30 02:45:31,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 814/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.915778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:31,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66019 samples/s/p 3:21:39 } +2024-07-30 02:45:34,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 816/ 3125], loss: 0.241, per_step_time: 1416ms, lr: 9.915146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:34,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.64670 samples/s/p 3:22:06 } +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 818/ 3125], loss: 0.152, per_step_time: 1425ms, lr: 9.91451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:37,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.61198 samples/s/p 3:23:18 } +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 820/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 9.913872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66066 samples/s/p 3:21:30 } +2024-07-30 02:45:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 822/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 9.913233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.64045 samples/s/p 3:22:10 } +2024-07-30 02:45:45,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 824/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 9.912591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:45,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66192 samples/s/p 3:21:22 } +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 826/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.911947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66002 samples/s/p 3:21:23 } +2024-07-30 02:45:51,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 828/ 3125], loss: 0.211, per_step_time: 1426ms, lr: 9.9112995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:51,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.60921 samples/s/p 3:23:09 } +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 830/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 9.910651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66215 samples/s/p 3:21:13 } +2024-07-30 02:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 832/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.909999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66047 samples/s/p 3:21:13 } +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 834/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 9.909346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65921 samples/s/p 3:21:13 } +2024-07-30 02:46:02,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 836/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.908689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66093 samples/s/p 3:21:07 } +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 838/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.908032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:05,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66026 samples/s/p 3:21:05 } +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 840/ 3125], loss: 0.184, per_step_time: 1412ms, lr: 9.90737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66217 samples/s/p 3:20:58 } +2024-07-30 02:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 842/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.906707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66000 samples/s/p 3:21:00 } +2024-07-30 02:46:13,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 844/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.906042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:13,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65861 samples/s/p 3:21:00 } +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 846/ 3125], loss: 0.305, per_step_time: 1417ms, lr: 9.905374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:16,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.64545 samples/s/p 3:21:26 } +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 848/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 9.904704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65767 samples/s/p 3:20:57 } +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 850/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.904032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65983 samples/s/p 3:20:49 } +2024-07-30 02:46:25,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 852/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 9.903357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:25,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65498 samples/s/p 3:20:57 } +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 854/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.902679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.66002 samples/s/p 3:20:43 } +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 856/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65873 samples/s/p 3:20:43 } +2024-07-30 02:46:33,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 858/ 3125], loss: 0.175, per_step_time: 1416ms, lr: 9.901319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:33,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.64879 samples/s/p 3:21:02 } +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 860/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 9.900634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65489 samples/s/p 3:20:46 } +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 862/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 9.899947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66022 samples/s/p 3:20:32 } +2024-07-30 02:46:42,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 864/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.899259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:42,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65852 samples/s/p 3:20:32 } +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 866/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.8985665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66098 samples/s/p 3:20:24 } +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 868/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.8978735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65746 samples/s/p 3:20:29 } +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 870/ 3125], loss: 0.532, per_step_time: 1413ms, lr: 9.897178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66109 samples/s/p 3:20:18 } +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 872/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.896479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65768 samples/s/p 3:20:23 } +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 874/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 9.895779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65989 samples/s/p 3:20:15 } +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 876/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.895076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66160 samples/s/p 3:20:09 } +2024-07-30 02:47:02,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 878/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.894371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:02,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.66118 samples/s/p 3:20:07 } +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 880/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 9.893663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65462 samples/s/p 3:20:18 } +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 882/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 9.892953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.66156 samples/s/p 3:20:00 } +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 884/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.892241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65987 samples/s/p 3:20:01 } +2024-07-30 02:47:13,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 886/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.891526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:13,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66111 samples/s/p 3:19:56 } +2024-07-30 02:47:16,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 888/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 9.890809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:16,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65308 samples/s/p 3:20:10 } +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 890/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 9.89009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:19,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66258 samples/s/p 3:19:47 } +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 892/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.889369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65978 samples/s/p 3:19:50 } +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 894/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.888645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:24,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65653 samples/s/p 3:19:54 } +2024-07-30 02:47:27,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 896/ 3125], loss: 0.519, per_step_time: 1414ms, lr: 9.887918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:27,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65697 samples/s/p 3:19:50 } +2024-07-30 02:47:30,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 898/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.88719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:30,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65790 samples/s/p 3:19:46 } +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 900/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 9.886458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.66216 samples/s/p 3:19:34 } +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 902/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 9.885725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65998 samples/s/p 3:19:36 } +2024-07-30 02:47:38,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 904/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.8849905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:38,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65727 samples/s/p 3:19:38 } +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 906/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 9.884252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65738 samples/s/p 3:19:35 } +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 908/ 3125], loss: 0.134, per_step_time: 1414ms, lr: 9.883512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65758 samples/s/p 3:19:32 } +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 910/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.8827695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:47,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65831 samples/s/p 3:19:28 } +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 912/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 9.882025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.66059 samples/s/p 3:19:20 } +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 914/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.881277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65990 samples/s/p 3:19:19 } +2024-07-30 02:47:55,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 916/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.8805285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:55,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.66105 samples/s/p 3:19:13 } +2024-07-30 02:47:58,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 918/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.879776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:58,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65909 samples/s/p 3:19:15 } +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 920/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.8790215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65863 samples/s/p 3:19:13 } +2024-07-30 02:48:04,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 922/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.878265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:04,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65653 samples/s/p 3:19:15 } +2024-07-30 02:48:07,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 924/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 9.877506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:07,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65389 samples/s/p 3:19:17 } +2024-07-30 02:48:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 926/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 9.876745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65735 samples/s/p 3:19:07 } +2024-07-30 02:48:12,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 928/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 9.875981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:12,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65926 samples/s/p 3:19:00 } +2024-07-30 02:48:15,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 930/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.875215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:15,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65780 samples/s/p 3:19:01 } +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 932/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 9.874447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.66065 samples/s/p 3:18:52 } +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 934/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.873676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.65517 samples/s/p 3:19:00 } +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 936/ 3125], loss: 0.248, per_step_time: 1424ms, lr: 9.872903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.61420 samples/s/p 3:20:25 } +2024-07-30 02:48:27,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 938/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.872128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:27,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65947 samples/s/p 3:18:46 } +2024-07-30 02:48:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 940/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.871351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:30,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.66011 samples/s/p 3:18:42 } +2024-07-30 02:48:32,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 942/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 9.8705705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.66147 samples/s/p 3:18:36 } +2024-07-30 02:48:35,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 944/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 9.869788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66032 samples/s/p 3:18:35 } +2024-07-30 02:48:38,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 946/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.869004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:38,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66170 samples/s/p 3:18:30 } +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 948/ 3125], loss: 0.341, per_step_time: 1412ms, lr: 9.868218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66190 samples/s/p 3:18:26 } +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 950/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.867428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66068 samples/s/p 3:18:26 } +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 952/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 9.866637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:47,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66122 samples/s/p 3:18:22 } +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 954/ 3125], loss: 0.370, per_step_time: 1412ms, lr: 9.865843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66196 samples/s/p 3:18:18 } +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 956/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.865046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66130 samples/s/p 3:18:16 } +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 958/ 3125], loss: 0.088, per_step_time: 1417ms, lr: 9.864249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:55,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64477 samples/s/p 3:18:48 } +2024-07-30 02:48:58,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 960/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.863448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:58,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64932 samples/s/p 3:18:36 } +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 962/ 3125], loss: 0.118, per_step_time: 1422ms, lr: 9.862644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.62492 samples/s/p 3:19:25 } +2024-07-30 02:49:04,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 964/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.861839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:04,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65798 samples/s/p 3:18:12 } +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 966/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.861032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65875 samples/s/p 3:18:08 } +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 968/ 3125], loss: 0.405, per_step_time: 1415ms, lr: 9.860221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65036 samples/s/p 3:18:22 } +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 970/ 3125], loss: 0.535, per_step_time: 1413ms, lr: 9.859409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65872 samples/s/p 3:18:02 } +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 972/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 9.858593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65991 samples/s/p 3:17:57 } +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 974/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 9.8577775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65968 samples/s/p 3:17:54 } +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 976/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.856958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66017 samples/s/p 3:17:51 } +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 978/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.856137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66072 samples/s/p 3:17:47 } +2024-07-30 02:49:26,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 980/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.855313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:26,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66068 samples/s/p 3:17:44 } +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 982/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.854486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65950 samples/s/p 3:17:43 } +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 984/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.8536575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65978 samples/s/p 3:17:40 } +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 986/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.852827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:35,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65918 samples/s/p 3:17:38 } +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 988/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.851993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66054 samples/s/p 3:17:33 } +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 990/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 9.851158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65726 samples/s/p 3:17:37 } +2024-07-30 02:49:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 992/ 3125], loss: 0.267, per_step_time: 1416ms, lr: 9.85032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.64704 samples/s/p 3:17:55 } +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 994/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 9.849479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65769 samples/s/p 3:17:30 } +2024-07-30 02:49:49,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 996/ 3125], loss: 0.733, per_step_time: 1413ms, lr: 9.848637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:49,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65861 samples/s/p 3:17:26 } +2024-07-30 02:49:52,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 998/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.847792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:52,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65610 samples/s/p 3:17:28 } +2024-07-30 02:49:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1000/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 9.846945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65866 samples/s/p 3:17:20 } +2024-07-30 02:49:57,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1002/ 3125], loss: 0.196, per_step_time: 1415ms, lr: 9.846096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65225 samples/s/p 3:17:30 } +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1004/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.845244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:00,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.66049 samples/s/p 3:17:10 } +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1006/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.84439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:03,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65727 samples/s/p 3:17:14 } +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1008/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 9.843533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65477 samples/s/p 3:17:17 } +2024-07-30 02:50:09,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1010/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.842675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:09,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65845 samples/s/p 3:17:06 } +2024-07-30 02:50:12,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1012/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.841814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:12,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65986 samples/s/p 3:17:00 } +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1014/ 3125], loss: 0.384, per_step_time: 1412ms, lr: 9.840951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:14,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66224 samples/s/p 3:16:52 } +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1016/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.840085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66054 samples/s/p 3:16:53 } +2024-07-30 02:50:20,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1018/ 3125], loss: 0.232, per_step_time: 1416ms, lr: 9.839217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:20,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64642 samples/s/p 3:17:20 } +2024-07-30 02:50:23,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1020/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.838346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:23,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65980 samples/s/p 3:16:49 } +2024-07-30 02:50:26,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1022/ 3125], loss: 0.533, per_step_time: 1413ms, lr: 9.837474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65950 samples/s/p 3:16:47 } +2024-07-30 02:50:29,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1024/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.836599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:29,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65998 samples/s/p 3:16:43 } +2024-07-30 02:50:31,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1026/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.835722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:31,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.66128 samples/s/p 3:16:38 } +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1028/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 9.834843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66032 samples/s/p 3:16:37 } +2024-07-30 02:50:37,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1030/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.833961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:37,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66057 samples/s/p 3:16:33 } +2024-07-30 02:50:40,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1032/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.833077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:40,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66037 samples/s/p 3:16:31 } +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1034/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.83219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66255 samples/s/p 3:16:24 } +2024-07-30 02:50:46,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1036/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.831302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:46,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66062 samples/s/p 3:16:25 } +2024-07-30 02:50:48,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1038/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.83041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:48,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66147 samples/s/p 3:16:20 } +2024-07-30 02:50:51,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1040/ 3125], loss: 0.089, per_step_time: 1412ms, lr: 9.829518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:51,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66209 samples/s/p 3:16:16 } +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1042/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.828622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:54,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66007 samples/s/p 3:16:17 } +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1044/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.827724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66083 samples/s/p 3:16:13 } +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1046/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.826823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65856 samples/s/p 3:16:15 } +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1048/ 3125], loss: 0.387, per_step_time: 1414ms, lr: 9.825921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65586 samples/s/p 3:16:18 } +2024-07-30 02:51:05,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1050/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 9.825016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:05,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65660 samples/s/p 3:16:13 } +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1052/ 3125], loss: 0.115, per_step_time: 1413ms, lr: 9.824109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.66037 samples/s/p 3:16:03 } +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1054/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 9.8231985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:11,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65674 samples/s/p 3:16:07 } +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1056/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.822287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66006 samples/s/p 3:15:58 } +2024-07-30 02:51:17,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1058/ 3125], loss: 0.219, per_step_time: 1416ms, lr: 9.821373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:17,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.64679 samples/s/p 3:16:22 } +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1060/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.820457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:20,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66038 samples/s/p 3:15:51 } +2024-07-30 02:51:22,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1062/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 9.819539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65318 samples/s/p 3:16:04 } +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1064/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.8186165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66062 samples/s/p 3:15:45 } +2024-07-30 02:51:28,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1066/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.817693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:28,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66019 samples/s/p 3:15:43 } +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1068/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 9.8167675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66259 samples/s/p 3:15:35 } +2024-07-30 02:51:34,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1070/ 3125], loss: 0.564, per_step_time: 1413ms, lr: 9.815841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:34,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65914 samples/s/p 3:15:40 } +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1072/ 3125], loss: 0.245, per_step_time: 1412ms, lr: 9.81491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66179 samples/s/p 3:15:31 } +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1074/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.813978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65603 samples/s/p 3:15:41 } +2024-07-30 02:51:42,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1076/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 9.813043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:42,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66060 samples/s/p 3:15:28 } +2024-07-30 02:51:45,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1078/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.812105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:45,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66170 samples/s/p 3:15:23 } +2024-07-30 02:51:48,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1080/ 3125], loss: 0.149, per_step_time: 1412ms, lr: 9.811166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:48,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66281 samples/s/p 3:15:18 } +2024-07-30 02:51:51,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1082/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.810225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:51,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65912 samples/s/p 3:15:23 } +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1084/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.8092805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66162 samples/s/p 3:15:15 } +2024-07-30 02:51:56,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1086/ 3125], loss: 0.335, per_step_time: 1412ms, lr: 9.808335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:56,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66220 samples/s/p 3:15:11 } +2024-07-30 02:51:59,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1088/ 3125], loss: 0.302, per_step_time: 1416ms, lr: 9.807386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:59,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.64762 samples/s/p 3:15:38 } +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1090/ 3125], loss: 0.307, per_step_time: 1415ms, lr: 9.806435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65082 samples/s/p 3:15:29 } +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1092/ 3125], loss: 0.224, per_step_time: 1415ms, lr: 9.8054825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65306 samples/s/p 3:15:21 } +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1094/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 9.804527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65359 samples/s/p 3:15:17 } +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1096/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.803569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65932 samples/s/p 3:15:03 } +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1098/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 9.8026085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65662 samples/s/p 3:15:05 } +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1100/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.801647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65759 samples/s/p 3:15:01 } +2024-07-30 02:52:19,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1102/ 3125], loss: 0.628, per_step_time: 1413ms, lr: 9.800682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:19,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65843 samples/s/p 3:14:56 } +2024-07-30 02:52:22,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1104/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.799715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:22,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66124 samples/s/p 3:14:47 } +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1106/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 9.798746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66082 samples/s/p 3:14:45 } +2024-07-30 02:52:28,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1108/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.7977745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66019 samples/s/p 3:14:44 } +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1110/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.7968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66108 samples/s/p 3:14:39 } +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1112/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.795824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:33,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65832 samples/s/p 3:14:42 } +2024-07-30 02:52:36,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1114/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.794847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:36,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65957 samples/s/p 3:14:37 } +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1116/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.7938655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:39,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66035 samples/s/p 3:14:32 } +2024-07-30 02:52:42,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1118/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 9.792882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:42,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66114 samples/s/p 3:14:28 } +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1120/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 9.791896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66216 samples/s/p 3:14:23 } +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1122/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 9.790909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.65619 samples/s/p 3:14:32 } +2024-07-30 02:52:50,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1124/ 3125], loss: 0.094, per_step_time: 1416ms, lr: 9.789919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:50,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.64852 samples/s/p 3:14:45 } +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1126/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.788928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.66023 samples/s/p 3:14:18 } +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1128/ 3125], loss: 0.300, per_step_time: 1416ms, lr: 9.787934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.64646 samples/s/p 3:14:44 } +2024-07-30 02:52:59,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1130/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.786936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:59,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66075 samples/s/p 3:14:12 } +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1132/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.785938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65983 samples/s/p 3:14:11 } +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1134/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.784937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65931 samples/s/p 3:14:09 } +2024-07-30 02:53:07,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1136/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 9.783933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:07,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66249 samples/s/p 3:14:00 } +2024-07-30 02:53:10,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1138/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 9.782927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:10,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65722 samples/s/p 3:14:08 } +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1140/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.781919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.66070 samples/s/p 3:13:58 } +2024-07-30 02:53:16,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1142/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.780909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:16,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65686 samples/s/p 3:14:03 } +2024-07-30 02:53:19,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1144/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 9.779896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:19,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65417 samples/s/p 3:14:05 } +2024-07-30 02:53:22,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1146/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 9.778881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:22,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65726 samples/s/p 3:13:56 } +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1148/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.777864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65927 samples/s/p 3:13:49 } +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1150/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 9.776844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:27,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65617 samples/s/p 3:13:53 } +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1152/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.775823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.66079 samples/s/p 3:13:40 } +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1154/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.774798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:33,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65653 samples/s/p 3:13:46 } +2024-07-30 02:53:36,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1156/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.773771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:36,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65882 samples/s/p 3:13:39 } +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1158/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.772743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66062 samples/s/p 3:13:32 } +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1160/ 3125], loss: 0.465, per_step_time: 1412ms, lr: 9.771713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66210 samples/s/p 3:13:26 } +2024-07-30 02:53:44,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1162/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.770679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:44,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65774 samples/s/p 3:13:33 } +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1164/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 9.769644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66122 samples/s/p 3:13:23 } +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1166/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.768606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:50,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66113 samples/s/p 3:13:20 } +2024-07-30 02:53:53,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1168/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.767566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:53,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66151 samples/s/p 3:13:16 } +2024-07-30 02:53:56,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1170/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:56,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66161 samples/s/p 3:13:13 } +2024-07-30 02:53:58,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1172/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.765479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:58,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65791 samples/s/p 3:13:18 } +2024-07-30 02:54:01,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1174/ 3125], loss: 0.124, per_step_time: 1416ms, lr: 9.764432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:01,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.64919 samples/s/p 3:13:33 } +2024-07-30 02:54:04,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1176/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 9.763384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:04,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66077 samples/s/p 3:13:07 } +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1178/ 3125], loss: 0.391, per_step_time: 1415ms, lr: 9.762332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:07,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65361 samples/s/p 3:13:18 } +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1180/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 9.761278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65679 samples/s/p 3:13:09 } +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1182/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 9.760222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65713 samples/s/p 3:13:06 } +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1184/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 9.759164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65625 samples/s/p 3:13:05 } +2024-07-30 02:54:18,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1186/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 9.758104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65843 samples/s/p 3:12:57 } +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1188/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.75704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66042 samples/s/p 3:12:50 } +2024-07-30 02:54:24,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1190/ 3125], loss: 0.580, per_step_time: 1413ms, lr: 9.755976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:24,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66095 samples/s/p 3:12:46 } +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1192/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.754908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65839 samples/s/p 3:12:49 } +2024-07-30 02:54:30,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1194/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.75384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:30,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66000 samples/s/p 3:12:43 } +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1196/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.752767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66076 samples/s/p 3:12:38 } +2024-07-30 02:54:35,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1198/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.751693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:35,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65868 samples/s/p 3:12:40 } +2024-07-30 02:54:38,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1200/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 9.750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:38,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65725 samples/s/p 3:12:40 } +2024-07-30 02:54:41,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1202/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 9.749538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:41,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65898 samples/s/p 3:12:34 } +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1204/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.748457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66121 samples/s/p 3:12:26 } +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1206/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 9.747374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65746 samples/s/p 3:12:31 } +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1208/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.746288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66049 samples/s/p 3:12:22 } +2024-07-30 02:54:52,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1210/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.7452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66139 samples/s/p 3:12:17 } +2024-07-30 02:54:55,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1212/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 9.744111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:55,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65808 samples/s/p 3:12:21 } +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1214/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.7430175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:58,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65991 samples/s/p 3:12:15 } +2024-07-30 02:55:01,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1216/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.741923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:01,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.66130 samples/s/p 3:12:09 } +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1218/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.7408265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.65964 samples/s/p 3:12:10 } +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1220/ 3125], loss: 0.406, per_step_time: 1417ms, lr: 9.739729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64204 samples/s/p 3:12:43 } +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1222/ 3125], loss: 0.280, per_step_time: 1416ms, lr: 9.738626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64739 samples/s/p 3:12:29 } +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1224/ 3125], loss: 0.308, per_step_time: 1426ms, lr: 9.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.60637 samples/s/p 3:13:51 } +2024-07-30 02:55:15,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1226/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.736417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:15,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66149 samples/s/p 3:11:54 } +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1228/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 9.7353095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66065 samples/s/p 3:11:53 } +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1230/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.734199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65951 samples/s/p 3:11:53 } +2024-07-30 02:55:23,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1232/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.733087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:23,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65897 samples/s/p 3:11:51 } +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1234/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 9.731971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65576 samples/s/p 3:11:55 } +2024-07-30 02:55:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1236/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.730855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:29,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65903 samples/s/p 3:11:45 } +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1238/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.729735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66019 samples/s/p 3:11:40 } +2024-07-30 02:55:35,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1240/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.728614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66078 samples/s/p 3:11:36 } +2024-07-30 02:55:38,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1242/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 9.727489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:38,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65923 samples/s/p 3:11:36 } +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1244/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 9.726363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66162 samples/s/p 3:11:29 } +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1246/ 3125], loss: 0.466, per_step_time: 1414ms, lr: 9.725235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65578 samples/s/p 3:11:38 } +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1248/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 9.7241045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66109 samples/s/p 3:11:24 } +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1250/ 3125], loss: 0.301, per_step_time: 1415ms, lr: 9.722971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65130 samples/s/p 3:11:41 } +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1252/ 3125], loss: 0.246, per_step_time: 1415ms, lr: 9.721835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65234 samples/s/p 3:11:36 } +2024-07-30 02:55:55,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1254/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.7206985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:55,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65794 samples/s/p 3:11:22 } +2024-07-30 02:55:57,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1256/ 3125], loss: 0.186, per_step_time: 1412ms, lr: 9.719559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:57,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66217 samples/s/p 3:11:11 } +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1258/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.718417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66032 samples/s/p 3:11:12 } +2024-07-30 02:56:03,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1260/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.717272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:03,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66058 samples/s/p 3:11:08 } +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1262/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.716126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:06,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66003 samples/s/p 3:11:07 } +2024-07-30 02:56:09,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1264/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.714978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:09,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66152 samples/s/p 3:11:01 } +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1266/ 3125], loss: 0.501, per_step_time: 1413ms, lr: 9.713827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66061 samples/s/p 3:11:00 } +2024-07-30 02:56:14,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1268/ 3125], loss: 0.166, per_step_time: 1417ms, lr: 9.712674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:14,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.64224 samples/s/p 3:11:34 } +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1270/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.711518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65920 samples/s/p 3:10:57 } +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1272/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.71036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65957 samples/s/p 3:10:53 } +2024-07-30 02:56:23,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1274/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.709201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:23,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65985 samples/s/p 3:10:50 } +2024-07-30 02:56:26,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1276/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.708038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:26,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65979 samples/s/p 3:10:47 } +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1278/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.706873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65685 samples/s/p 3:10:50 } +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1280/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 9.705706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65778 samples/s/p 3:10:46 } +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1282/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 9.704539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65142 samples/s/p 3:10:56 } +2024-07-30 02:56:37,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1284/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.703367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:37,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66051 samples/s/p 3:10:35 } +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1286/ 3125], loss: 0.480, per_step_time: 1416ms, lr: 9.702194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.64852 samples/s/p 3:10:56 } +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1288/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.701018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66155 samples/s/p 3:10:27 } +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1290/ 3125], loss: 0.396, per_step_time: 1412ms, lr: 9.69984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66194 samples/s/p 3:10:23 } +2024-07-30 02:56:48,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1292/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.6986605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66041 samples/s/p 3:10:23 } +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1294/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.697477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65811 samples/s/p 3:10:25 } +2024-07-30 02:56:54,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1296/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.696292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65793 samples/s/p 3:10:23 } +2024-07-30 02:56:57,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1298/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 9.695105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:57,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65977 samples/s/p 3:10:16 } +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1300/ 3125], loss: 0.553, per_step_time: 1418ms, lr: 9.693917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.64023 samples/s/p 3:10:53 } +2024-07-30 02:57:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1302/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.692725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:03,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66031 samples/s/p 3:10:09 } +2024-07-30 02:57:05,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1304/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 9.691531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:05,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66194 samples/s/p 3:10:03 } +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1306/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 9.690336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66058 samples/s/p 3:10:03 } +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1308/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.689138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.65771 samples/s/p 3:10:06 } +2024-07-30 02:57:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1310/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.687938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:14,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66060 samples/s/p 3:09:58 } +2024-07-30 02:57:17,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1312/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 9.686734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:17,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66109 samples/s/p 3:09:54 } +2024-07-30 02:57:20,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1314/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.685529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:20,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.66012 samples/s/p 3:09:53 } +2024-07-30 02:57:22,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1316/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.684323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:22,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65493 samples/s/p 3:10:01 } +2024-07-30 02:57:25,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1318/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.683114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:25,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66129 samples/s/p 3:09:45 } +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1320/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 9.681902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:28,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65749 samples/s/p 3:09:50 } +2024-07-30 02:57:31,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1322/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.680688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:31,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66053 samples/s/p 3:09:41 } +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1324/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 9.679472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66210 samples/s/p 3:09:35 } +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1326/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.678254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66023 samples/s/p 3:09:36 } +2024-07-30 02:57:40,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1328/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 9.677034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:40,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65664 samples/s/p 3:09:40 } +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1330/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 9.67581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65820 samples/s/p 3:09:34 } +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1332/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.674586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:45,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.66078 samples/s/p 3:09:26 } +2024-07-30 02:57:48,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1334/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.673359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.66014 samples/s/p 3:09:25 } +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1336/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.67213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65526 samples/s/p 3:09:32 } +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1338/ 3125], loss: 0.599, per_step_time: 1413ms, lr: 9.670897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:54,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66013 samples/s/p 3:09:19 } +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1340/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 9.669664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65440 samples/s/p 3:09:28 } +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1342/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.668427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:59,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66068 samples/s/p 3:09:12 } +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1344/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.667189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65836 samples/s/p 3:09:14 } +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1346/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.665949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66163 samples/s/p 3:09:05 } +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1348/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.664705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66134 samples/s/p 3:09:02 } +2024-07-30 02:58:11,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1350/ 3125], loss: 0.249, per_step_time: 1412ms, lr: 9.663461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:11,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66405 samples/s/p 3:08:54 } +2024-07-30 02:58:14,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1352/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.662214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:14,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66116 samples/s/p 3:08:57 } +2024-07-30 02:58:16,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1354/ 3125], loss: 0.305, per_step_time: 1412ms, lr: 9.660965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:16,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66195 samples/s/p 3:08:53 } +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1356/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 9.659713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65815 samples/s/p 3:08:57 } +2024-07-30 02:58:22,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1358/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 9.658459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:22,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66038 samples/s/p 3:08:50 } +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1360/ 3125], loss: 0.098, per_step_time: 1412ms, lr: 9.657203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66301 samples/s/p 3:08:42 } +2024-07-30 02:58:28,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1362/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 9.655945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:28,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65965 samples/s/p 3:08:46 } +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1364/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.654684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66110 samples/s/p 3:08:40 } +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1366/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.65342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65807 samples/s/p 3:08:43 } +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1368/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 9.652156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65976 samples/s/p 3:08:37 } +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1370/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.650888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66105 samples/s/p 3:08:32 } +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1372/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 9.64962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66237 samples/s/p 3:08:26 } +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1374/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.648348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66141 samples/s/p 3:08:26 } +2024-07-30 02:58:48,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1376/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.647073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:48,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66068 samples/s/p 3:08:24 } +2024-07-30 02:58:50,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1378/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.645798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:50,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65797 samples/s/p 3:08:27 } +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1380/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.64452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66056 samples/s/p 3:08:19 } +2024-07-30 02:58:56,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1382/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.643239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:56,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65984 samples/s/p 3:08:17 } +2024-07-30 02:58:59,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1384/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.641956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:59,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65935 samples/s/p 3:08:16 } +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1386/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 9.640671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65198 samples/s/p 3:08:27 } +2024-07-30 02:59:05,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1388/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.639384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:05,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65730 samples/s/p 3:08:14 } +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1390/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 9.6380945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.66015 samples/s/p 3:08:05 } +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1392/ 3125], loss: 0.252, per_step_time: 1416ms, lr: 9.636802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.64813 samples/s/p 3:08:27 } +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1394/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 9.635509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:13,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65661 samples/s/p 3:08:07 } +2024-07-30 02:59:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1396/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.634213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66098 samples/s/p 3:07:55 } +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1398/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.632915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66050 samples/s/p 3:07:53 } +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1400/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.6316135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65757 samples/s/p 3:07:56 } +2024-07-30 02:59:22,059 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1402/ 3125], loss: 0.537, per_step_time: 2374ms, lr: 9.630311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 3.36955 samples/s/p 5:15:29 } +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1404/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.629006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65799 samples/s/p 3:07:50 } +2024-07-30 03:00:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1406/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 9.6277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:02,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65855 samples/s/p 3:07:46 } +2024-07-30 03:00:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1408/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.62639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:05,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.66081 samples/s/p 3:07:39 } +2024-07-30 03:00:08,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1410/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 9.625078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:08,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65484 samples/s/p 3:07:48 } +2024-07-30 03:00:11,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1412/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 9.6237645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:11,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65153 samples/s/p 3:07:51 } +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1414/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 9.6224485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:14,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65619 samples/s/p 3:07:39 } +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1416/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.621131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66096 samples/s/p 3:07:27 } +2024-07-30 03:00:19,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1418/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 9.61981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:19,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66226 samples/s/p 3:07:22 } +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1420/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.618488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66137 samples/s/p 3:07:21 } +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1422/ 3125], loss: 0.702, per_step_time: 1413ms, lr: 9.617163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66085 samples/s/p 3:07:19 } +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1424/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.615836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66000 samples/s/p 3:07:18 } +2024-07-30 03:00:31,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1426/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 9.614508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:31,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65653 samples/s/p 3:07:22 } +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1428/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.613175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:34,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66046 samples/s/p 3:07:11 } +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1430/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 9.611842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:36,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66163 samples/s/p 3:07:06 } +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1432/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.610506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66007 samples/s/p 3:07:06 } +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1434/ 3125], loss: 0.264, per_step_time: 1416ms, lr: 9.609167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:42,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.64903 samples/s/p 3:07:25 } +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1436/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.607828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66056 samples/s/p 3:07:00 } +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1438/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.606485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:48,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66078 samples/s/p 3:06:56 } +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1440/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 9.605141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66266 samples/s/p 3:06:50 } +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1442/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 9.603795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66071 samples/s/p 3:06:51 } +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1444/ 3125], loss: 0.148, per_step_time: 1418ms, lr: 9.602445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.63992 samples/s/p 3:07:29 } +2024-07-30 03:00:59,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1446/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.601094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64667 samples/s/p 3:07:13 } +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1448/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 9.599741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64880 samples/s/p 3:07:06 } +2024-07-30 03:01:05,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1450/ 3125], loss: 0.306, per_step_time: 1419ms, lr: 9.598385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:05,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63489 samples/s/p 3:07:31 } +2024-07-30 03:01:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1452/ 3125], loss: 0.187, per_step_time: 1421ms, lr: 9.597027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:08,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.62950 samples/s/p 3:07:39 } +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1454/ 3125], loss: 0.147, per_step_time: 1419ms, lr: 9.595667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:10,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63660 samples/s/p 3:07:22 } +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1456/ 3125], loss: 0.250, per_step_time: 1427ms, lr: 9.594305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.60545 samples/s/p 3:08:21 } +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1458/ 3125], loss: 0.402, per_step_time: 1418ms, lr: 9.592941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.63952 samples/s/p 3:07:10 } +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1460/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.591575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:19,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.66045 samples/s/p 3:06:26 } +2024-07-30 03:01:22,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1462/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.590206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:22,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65892 samples/s/p 3:06:26 } +2024-07-30 03:01:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1464/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.588835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:25,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65819 samples/s/p 3:06:25 } +2024-07-30 03:01:28,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1466/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 9.587462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:28,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65862 samples/s/p 3:06:21 } +2024-07-30 03:01:30,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1468/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.586086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:30,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65818 samples/s/p 3:06:19 } +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1470/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 9.584708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65476 samples/s/p 3:06:23 } +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1472/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.583328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65924 samples/s/p 3:06:11 } +2024-07-30 03:01:39,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1474/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.581947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.66066 samples/s/p 3:06:06 } +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1476/ 3125], loss: 0.335, per_step_time: 1416ms, lr: 9.580563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.64839 samples/s/p 3:06:27 } +2024-07-30 03:01:45,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1478/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.579177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65927 samples/s/p 3:06:03 } +2024-07-30 03:01:47,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1480/ 3125], loss: 0.177, per_step_time: 1418ms, lr: 9.577788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:47,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.63795 samples/s/p 3:06:42 } +2024-07-30 03:01:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1482/ 3125], loss: 0.156, per_step_time: 1421ms, lr: 9.576398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:50,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.62937 samples/s/p 3:06:56 } +2024-07-30 03:01:53,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1484/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 9.575005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:53,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65428 samples/s/p 3:06:04 } +2024-07-30 03:01:56,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1486/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.5736095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:56,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65445 samples/s/p 3:06:01 } +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1488/ 3125], loss: 0.203, per_step_time: 1416ms, lr: 9.572213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.64670 samples/s/p 3:06:13 } +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1490/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 9.570813e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:02,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66239 samples/s/p 3:05:40 } +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1492/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.569411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66103 samples/s/p 3:05:40 } +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1494/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 9.568008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:07,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66113 samples/s/p 3:05:36 } +2024-07-30 03:02:10,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1496/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.566602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:10,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65742 samples/s/p 3:05:41 } +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1498/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 9.565194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:13,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65560 samples/s/p 3:05:42 } +2024-07-30 03:02:16,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1500/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 9.563783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:16,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65963 samples/s/p 3:05:31 } +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1502/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.562372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:19,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.66019 samples/s/p 3:05:27 } +2024-07-30 03:02:21,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1504/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.560956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:21,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.66107 samples/s/p 3:05:22 } +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1506/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 9.55954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:24,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66145 samples/s/p 3:05:19 } +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1508/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 9.558121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65681 samples/s/p 3:05:25 } +2024-07-30 03:02:30,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1510/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 9.556699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:30,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.64857 samples/s/p 3:05:39 } +2024-07-30 03:02:33,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1512/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 9.555276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65758 samples/s/p 3:05:18 } +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1514/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 9.553851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66011 samples/s/p 3:05:10 } +2024-07-30 03:02:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1516/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 9.552423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:38,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65937 samples/s/p 3:05:09 } +2024-07-30 03:02:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1518/ 3125], loss: 0.398, per_step_time: 1415ms, lr: 9.550993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65291 samples/s/p 3:05:19 } +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1520/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 9.549562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.66246 samples/s/p 3:04:57 } +2024-07-30 03:02:47,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1522/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.548126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:47,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65868 samples/s/p 3:05:02 } +2024-07-30 03:02:50,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1524/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.54669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.66013 samples/s/p 3:04:56 } +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1526/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 9.545252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65250 samples/s/p 3:05:08 } +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1528/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.543812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65785 samples/s/p 3:04:55 } +2024-07-30 03:02:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1530/ 3125], loss: 0.642, per_step_time: 1413ms, lr: 9.542368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:58,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65993 samples/s/p 3:04:48 } +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1532/ 3125], loss: 0.652, per_step_time: 1414ms, lr: 9.540923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65461 samples/s/p 3:04:56 } +2024-07-30 03:03:04,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1534/ 3125], loss: 0.135, per_step_time: 1414ms, lr: 9.539476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:04,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65452 samples/s/p 3:04:53 } +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1536/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.5380265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65955 samples/s/p 3:04:40 } +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1538/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 9.536576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:10,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66038 samples/s/p 3:04:36 } +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1540/ 3125], loss: 0.369, per_step_time: 1412ms, lr: 9.5351215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66201 samples/s/p 3:04:30 } +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1542/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.533665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65971 samples/s/p 3:04:31 } +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1544/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.532207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:18,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66062 samples/s/p 3:04:27 } +2024-07-30 03:03:21,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1546/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.530747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:21,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66169 samples/s/p 3:04:22 } +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1548/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.529285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66046 samples/s/p 3:04:22 } +2024-07-30 03:03:27,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1550/ 3125], loss: 0.290, per_step_time: 1412ms, lr: 9.52782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:27,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66264 samples/s/p 3:04:14 } +2024-07-30 03:03:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1552/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.526354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:29,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66087 samples/s/p 3:04:15 } +2024-07-30 03:03:32,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1554/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 9.524885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:32,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65465 samples/s/p 3:04:24 } +2024-07-30 03:03:35,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1556/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 9.5234145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:35,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66043 samples/s/p 3:04:10 } +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1558/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.52194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:38,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65986 samples/s/p 3:04:09 } +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1560/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 9.520465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66256 samples/s/p 3:04:00 } +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1562/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.518988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.66027 samples/s/p 3:04:02 } +2024-07-30 03:03:46,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1564/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 9.517508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:46,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65734 samples/s/p 3:04:05 } +2024-07-30 03:03:49,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1566/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 9.516027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:49,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65810 samples/s/p 3:04:01 } +2024-07-30 03:03:52,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1568/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.514542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:52,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65806 samples/s/p 3:03:58 } +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1570/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.513056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65874 samples/s/p 3:03:54 } +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1572/ 3125], loss: 0.147, per_step_time: 1414ms, lr: 9.511568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:58,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65494 samples/s/p 3:03:58 } +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1574/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.510079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:01,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65799 samples/s/p 3:03:50 } +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1576/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.508584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.66149 samples/s/p 3:03:40 } +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1578/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.50709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:06,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65945 samples/s/p 3:03:41 } +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1580/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.505594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65825 samples/s/p 3:03:41 } +2024-07-30 03:04:12,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1582/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.504094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:12,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65840 samples/s/p 3:03:37 } +2024-07-30 03:04:15,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1584/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 9.5025935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:15,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65568 samples/s/p 3:03:40 } +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1586/ 3125], loss: 0.383, per_step_time: 1416ms, lr: 9.50109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.64876 samples/s/p 3:03:51 } +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1588/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.499584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65967 samples/s/p 3:03:26 } +2024-07-30 03:04:23,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1590/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.498076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:23,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65414 samples/s/p 3:03:34 } +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1592/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.496567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:26,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.66118 samples/s/p 3:03:18 } +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1594/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.495055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65423 samples/s/p 3:03:29 } +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1596/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.49354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65835 samples/s/p 3:03:18 } +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1598/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.492024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:35,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65417 samples/s/p 3:03:23 } +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1600/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.490506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:38,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65728 samples/s/p 3:03:14 } +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1602/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.488986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66052 samples/s/p 3:03:05 } +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1604/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 9.487463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66318 samples/s/p 3:02:57 } +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1606/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.485938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65980 samples/s/p 3:03:01 } +2024-07-30 03:04:49,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1608/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.484411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:49,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65631 samples/s/p 3:03:05 } +2024-07-30 03:04:52,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1610/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.482882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:52,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65882 samples/s/p 3:02:57 } +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1612/ 3125], loss: 0.373, per_step_time: 1414ms, lr: 9.48135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65764 samples/s/p 3:02:57 } +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1614/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.479818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.66134 samples/s/p 3:02:47 } +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1616/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.478282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65896 samples/s/p 3:02:48 } +2024-07-30 03:05:03,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1618/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.476745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:03,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.65891 samples/s/p 3:02:46 } +2024-07-30 03:05:06,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1620/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.475205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:06,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66133 samples/s/p 3:02:38 } +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1622/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 9.473662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:09,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66037 samples/s/p 3:02:37 } +2024-07-30 03:05:12,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1624/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 9.472118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:12,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66113 samples/s/p 3:02:33 } +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1626/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.470572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:14,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66092 samples/s/p 3:02:30 } +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1628/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.469024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66040 samples/s/p 3:02:29 } +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1630/ 3125], loss: 0.332, per_step_time: 1412ms, lr: 9.467472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66211 samples/s/p 3:02:22 } +2024-07-30 03:05:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1632/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.465921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66208 samples/s/p 3:02:20 } +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1634/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.4643665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.65896 samples/s/p 3:02:23 } +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1636/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.4628085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66085 samples/s/p 3:02:16 } +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1638/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 9.46125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66029 samples/s/p 3:02:15 } +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1640/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 9.459689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65980 samples/s/p 3:02:13 } +2024-07-30 03:05:37,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1642/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.4581255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:37,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66042 samples/s/p 3:02:09 } +2024-07-30 03:05:40,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1644/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 9.45656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:40,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65206 samples/s/p 3:02:22 } +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1646/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 9.454992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:43,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65571 samples/s/p 3:02:12 } +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1648/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 9.453423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65840 samples/s/p 3:02:04 } +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1650/ 3125], loss: 0.204, per_step_time: 1415ms, lr: 9.451852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:48,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65310 samples/s/p 3:02:12 } +2024-07-30 03:05:51,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1652/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.450278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:51,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65997 samples/s/p 3:01:55 } +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1654/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.448701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:54,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.66122 samples/s/p 3:01:50 } +2024-07-30 03:05:57,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1656/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 9.447123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:57,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66095 samples/s/p 3:01:48 } +2024-07-30 03:06:00,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1658/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.445543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:00,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66071 samples/s/p 3:01:46 } +2024-07-30 03:06:03,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1660/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.443961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:03,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66167 samples/s/p 3:01:41 } +2024-07-30 03:06:05,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1662/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.442376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66012 samples/s/p 3:01:41 } +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1664/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.44079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65917 samples/s/p 3:01:40 } +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1666/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 9.439201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66377 samples/s/p 3:01:28 } +2024-07-30 03:06:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1668/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.43761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65834 samples/s/p 3:01:36 } +2024-07-30 03:06:17,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1670/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.436017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:17,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66139 samples/s/p 3:01:27 } +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1672/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.434422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65618 samples/s/p 3:01:34 } +2024-07-30 03:06:22,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1674/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.432824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65861 samples/s/p 3:01:27 } +2024-07-30 03:06:25,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1676/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 9.431225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66188 samples/s/p 3:01:18 } +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1678/ 3125], loss: 0.519, per_step_time: 1413ms, lr: 9.429624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:28,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65990 samples/s/p 3:01:19 } +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1680/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 9.42802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65597 samples/s/p 3:01:24 } +2024-07-30 03:06:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1682/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 9.426415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65653 samples/s/p 3:01:20 } +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1684/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 9.424806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.65802 samples/s/p 3:01:14 } +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1686/ 3125], loss: 0.527, per_step_time: 1412ms, lr: 9.423197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.66196 samples/s/p 3:01:04 } +2024-07-30 03:06:42,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1688/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.421586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66037 samples/s/p 3:01:04 } +2024-07-30 03:06:45,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1690/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.419971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:45,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.65929 samples/s/p 3:01:03 } +2024-07-30 03:06:48,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1692/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.418355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:48,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66156 samples/s/p 3:00:56 } +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1694/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.416737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:51,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66017 samples/s/p 3:00:56 } +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1696/ 3125], loss: 0.180, per_step_time: 1412ms, lr: 9.415116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66230 samples/s/p 3:00:49 } +2024-07-30 03:06:56,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1698/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.413494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:56,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66039 samples/s/p 3:00:50 } +2024-07-30 03:06:59,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1700/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 9.411869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65707 samples/s/p 3:00:53 } +2024-07-30 03:07:02,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1702/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 9.410242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:02,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65970 samples/s/p 3:00:45 } +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1704/ 3125], loss: 0.429, per_step_time: 1414ms, lr: 9.408614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65707 samples/s/p 3:00:48 } +2024-07-30 03:07:08,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1706/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.406983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:08,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66097 samples/s/p 3:00:37 } +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1708/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 9.4053485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65683 samples/s/p 3:00:42 } +2024-07-30 03:07:13,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1710/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 9.403714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:13,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66018 samples/s/p 3:00:33 } +2024-07-30 03:07:16,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1712/ 3125], loss: 0.343, per_step_time: 1412ms, lr: 9.402076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66176 samples/s/p 3:00:27 } +2024-07-30 03:07:19,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1714/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 9.400437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:19,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65954 samples/s/p 3:00:29 } +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1716/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.398796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66266 samples/s/p 3:00:20 } +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1718/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.397152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65952 samples/s/p 3:00:23 } +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1720/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.395506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65949 samples/s/p 3:00:20 } +2024-07-30 03:07:30,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1722/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.393859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:30,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65500 samples/s/p 3:00:26 } +2024-07-30 03:07:33,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1724/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 9.392209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65553 samples/s/p 3:00:22 } +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1726/ 3125], loss: 0.149, per_step_time: 1417ms, lr: 9.390556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:36,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.64380 samples/s/p 3:00:42 } +2024-07-30 03:07:39,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1728/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 9.388902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65711 samples/s/p 3:00:14 } +2024-07-30 03:07:42,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1730/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 9.387246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:42,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66100 samples/s/p 3:00:03 } +2024-07-30 03:07:45,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1732/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.385587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:45,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65622 samples/s/p 3:00:10 } +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1734/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.383927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65625 samples/s/p 3:00:07 } +2024-07-30 03:07:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1736/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.382265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66095 samples/s/p 2:59:55 } +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1738/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.380601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65647 samples/s/p 3:00:01 } +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1740/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.378934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66014 samples/s/p 2:59:51 } +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1742/ 3125], loss: 0.164, per_step_time: 1415ms, lr: 9.377265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65312 samples/s/p 3:00:01 } +2024-07-30 03:08:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1744/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.375594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66283 samples/s/p 2:59:40 } +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1746/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 9.373922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66281 samples/s/p 2:59:37 } +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1748/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.3722465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:07,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65635 samples/s/p 2:59:47 } +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1750/ 3125], loss: 0.379, per_step_time: 1412ms, lr: 9.3705685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:10,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66198 samples/s/p 2:59:33 } +2024-07-30 03:08:13,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1752/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.3688905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:13,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66107 samples/s/p 2:59:32 } +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1754/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.367209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:16,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66043 samples/s/p 2:59:30 } +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1756/ 3125], loss: 0.423, per_step_time: 1413ms, lr: 9.365525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.65829 samples/s/p 2:59:32 } +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1758/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.363841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:21,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66073 samples/s/p 2:59:24 } +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1760/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.362153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:24,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66160 samples/s/p 2:59:20 } +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1762/ 3125], loss: 0.590, per_step_time: 1413ms, lr: 9.360463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:27,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65997 samples/s/p 2:59:20 } +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1764/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.358771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65831 samples/s/p 2:59:20 } +2024-07-30 03:08:33,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.357077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:33,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66098 samples/s/p 2:59:12 } +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1768/ 3125], loss: 0.256, per_step_time: 1417ms, lr: 9.355382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.64370 samples/s/p 2:59:43 } +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1770/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.353684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66128 samples/s/p 2:59:06 } +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1772/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 9.351984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66208 samples/s/p 2:59:02 } +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1774/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.350281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.65920 samples/s/p 2:59:04 } +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1776/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 9.348578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66209 samples/s/p 2:58:56 } +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1778/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.346872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:50,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66102 samples/s/p 2:58:55 } +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1780/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 9.345163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66323 samples/s/p 2:58:48 } +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1782/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.343452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65907 samples/s/p 2:58:53 } +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1784/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 9.341739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65940 samples/s/p 2:58:50 } +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1786/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 9.340025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:01,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65526 samples/s/p 2:58:55 } +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1788/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.338309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65859 samples/s/p 2:58:46 } +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1790/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.33659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:07,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65852 samples/s/p 2:58:43 } +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1792/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.334869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65806 samples/s/p 2:58:41 } +2024-07-30 03:09:12,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1794/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 9.333146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:12,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65943 samples/s/p 2:58:36 } +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1796/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.331422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65658 samples/s/p 2:58:38 } +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1798/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 9.329694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65840 samples/s/p 2:58:32 } +2024-07-30 03:09:21,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1800/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.327966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:21,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65887 samples/s/p 2:58:28 } +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1802/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.326234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65635 samples/s/p 2:58:30 } +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1804/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.324502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:27,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.66068 samples/s/p 2:58:19 } +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1806/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.322765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65990 samples/s/p 2:58:18 } +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1808/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.321029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65784 samples/s/p 2:58:19 } +2024-07-30 03:09:35,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1810/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.319289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:35,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.66037 samples/s/p 2:58:11 } +2024-07-30 03:09:38,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1812/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.317549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:38,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65918 samples/s/p 2:58:11 } +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1814/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.315804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.66030 samples/s/p 2:58:06 } +2024-07-30 03:09:44,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1816/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.314059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:44,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66050 samples/s/p 2:58:03 } +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1818/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.312312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:46,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.65792 samples/s/p 2:58:05 } +2024-07-30 03:09:49,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1820/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 9.310561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:49,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66132 samples/s/p 2:57:55 } +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1822/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.30881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66025 samples/s/p 2:57:55 } +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1824/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.307057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66115 samples/s/p 2:57:50 } +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1826/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.3053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:58,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65927 samples/s/p 2:57:51 } +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1828/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 9.303542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66066 samples/s/p 2:57:45 } +2024-07-30 03:10:03,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1830/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.3017825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:03,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66000 samples/s/p 2:57:44 } +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1832/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 9.300021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:06,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65518 samples/s/p 2:57:50 } +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1834/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.298256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65815 samples/s/p 2:57:42 } +2024-07-30 03:10:12,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1836/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.296491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:12,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66187 samples/s/p 2:57:32 } +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1838/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.294722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66034 samples/s/p 2:57:32 } +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1840/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.292952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66218 samples/s/p 2:57:26 } +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1842/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.2911805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65932 samples/s/p 2:57:28 } +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1844/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.289406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66097 samples/s/p 2:57:22 } +2024-07-30 03:10:26,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1846/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.28763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:26,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65895 samples/s/p 2:57:23 } +2024-07-30 03:10:29,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1848/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.285851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:29,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66004 samples/s/p 2:57:18 } +2024-07-30 03:10:32,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1850/ 3125], loss: 0.507, per_step_time: 1413ms, lr: 9.28407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:32,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65929 samples/s/p 2:57:17 } +2024-07-30 03:10:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1852/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.282288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:35,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65610 samples/s/p 2:57:20 } +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1854/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.280503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:37,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65782 samples/s/p 2:57:14 } +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1856/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 9.278717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66197 samples/s/p 2:57:03 } +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1858/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.276928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65831 samples/s/p 2:57:07 } +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1860/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 9.275138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65934 samples/s/p 2:57:03 } +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1862/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.273345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:49,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66016 samples/s/p 2:56:58 } +2024-07-30 03:10:52,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1864/ 3125], loss: 0.226, per_step_time: 1412ms, lr: 9.271551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:52,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66174 samples/s/p 2:56:52 } +2024-07-30 03:10:54,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1866/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.269754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:54,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65954 samples/s/p 2:56:54 } +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1868/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 9.267955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65553 samples/s/p 2:56:58 } +2024-07-30 03:11:00,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1870/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.266154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:00,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66143 samples/s/p 2:56:45 } +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1872/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.264351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65908 samples/s/p 2:56:46 } +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1874/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 9.262546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:06,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65607 samples/s/p 2:56:49 } +2024-07-30 03:11:09,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1876/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.260739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:09,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65966 samples/s/p 2:56:39 } +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1878/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 9.258931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65428 samples/s/p 2:56:47 } +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1880/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.257119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.66152 samples/s/p 2:56:30 } +2024-07-30 03:11:17,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1882/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 9.255306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:17,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65826 samples/s/p 2:56:34 } +2024-07-30 03:11:20,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1884/ 3125], loss: 0.320, per_step_time: 1416ms, lr: 9.253491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:20,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.64890 samples/s/p 2:56:48 } +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1886/ 3125], loss: 0.366, per_step_time: 1424ms, lr: 9.251674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:23,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.61411 samples/s/p 2:57:51 } +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1888/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65683 samples/s/p 2:56:28 } +2024-07-30 03:11:29,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1890/ 3125], loss: 0.278, per_step_time: 1412ms, lr: 9.248033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66173 samples/s/p 2:56:16 } +2024-07-30 03:11:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1892/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.24621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:31,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66035 samples/s/p 2:56:16 } +2024-07-30 03:11:34,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1894/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.244384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66114 samples/s/p 2:56:11 } +2024-07-30 03:11:37,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1896/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 9.242558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:37,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65976 samples/s/p 2:56:11 } +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1898/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.240728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:40,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65806 samples/s/p 2:56:11 } +2024-07-30 03:11:43,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1900/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.238896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66144 samples/s/p 2:56:02 } +2024-07-30 03:11:46,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1902/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.237063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:46,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65902 samples/s/p 2:56:04 } +2024-07-30 03:11:48,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1904/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.235228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:48,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65997 samples/s/p 2:55:59 } +2024-07-30 03:11:51,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1906/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.233391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66158 samples/s/p 2:55:53 } +2024-07-30 03:11:54,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1908/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 9.231551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:54,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66157 samples/s/p 2:55:51 } +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1910/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 9.22971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:57,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.65940 samples/s/p 2:55:52 } +2024-07-30 03:12:00,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1912/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 9.227867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:00,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66119 samples/s/p 2:55:46 } +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1914/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.226022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66067 samples/s/p 2:55:44 } +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1916/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.2241735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66228 samples/s/p 2:55:38 } +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1918/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.222324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65984 samples/s/p 2:55:40 } +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1920/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 9.220473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66067 samples/s/p 2:55:35 } +2024-07-30 03:12:14,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1922/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.218618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:14,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66016 samples/s/p 2:55:33 } +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1924/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 9.216764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66079 samples/s/p 2:55:29 } +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1926/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.214905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:20,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66072 samples/s/p 2:55:27 } +2024-07-30 03:12:22,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1928/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.213046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65895 samples/s/p 2:55:27 } +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1930/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.211185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66097 samples/s/p 2:55:21 } +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1932/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 9.209321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:28,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65438 samples/s/p 2:55:30 } +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1934/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 9.207456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66139 samples/s/p 2:55:14 } +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1936/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.205588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65927 samples/s/p 2:55:15 } +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1938/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.203719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65978 samples/s/p 2:55:12 } +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1940/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 9.201847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65580 samples/s/p 2:55:16 } +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1942/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.199974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:42,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65709 samples/s/p 2:55:11 } +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1944/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.198097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:45,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66146 samples/s/p 2:55:00 } +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1946/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.19622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65925 samples/s/p 2:55:01 } +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1948/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.19434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65976 samples/s/p 2:54:57 } +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1950/ 3125], loss: 0.079, per_step_time: 1413ms, lr: 9.192459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:54,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65849 samples/s/p 2:54:57 } +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1952/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 9.190576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65681 samples/s/p 2:54:57 } +2024-07-30 03:12:59,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1954/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.18869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:59,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65909 samples/s/p 2:54:50 } +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1956/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.186801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66044 samples/s/p 2:54:45 } +2024-07-30 03:13:05,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1958/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.184912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:05,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66304 samples/s/p 2:54:37 } +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1960/ 3125], loss: 0.174, per_step_time: 1412ms, lr: 9.183021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66238 samples/s/p 2:54:36 } +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1962/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 9.181127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:11,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65681 samples/s/p 2:54:43 } +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1964/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.179231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66033 samples/s/p 2:54:34 } +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1966/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.1773345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:16,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66087 samples/s/p 2:54:30 } +2024-07-30 03:13:19,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1968/ 3125], loss: 0.075, per_step_time: 1413ms, lr: 9.175434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:19,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.65983 samples/s/p 2:54:29 } +2024-07-30 03:13:22,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1970/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.173533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:22,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66094 samples/s/p 2:54:24 } +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1972/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 9.171628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66103 samples/s/p 2:54:21 } +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1974/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.169723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66030 samples/s/p 2:54:20 } +2024-07-30 03:13:30,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1976/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.167815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:30,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66072 samples/s/p 2:54:16 } +2024-07-30 03:13:33,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1978/ 3125], loss: 0.148, per_step_time: 1414ms, lr: 9.165906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:33,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65740 samples/s/p 2:54:19 } +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1980/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.163994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66070 samples/s/p 2:54:10 } +2024-07-30 03:13:39,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1982/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.1620805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:39,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65838 samples/s/p 2:54:12 } +2024-07-30 03:13:42,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1984/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.160166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:42,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66195 samples/s/p 2:54:03 } +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1986/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.158248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66078 samples/s/p 2:54:02 } +2024-07-30 03:13:47,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1988/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.156328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:47,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66032 samples/s/p 2:54:00 } +2024-07-30 03:13:50,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1990/ 3125], loss: 0.410, per_step_time: 1412ms, lr: 9.154406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:50,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66201 samples/s/p 2:53:54 } +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1992/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.1524835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66131 samples/s/p 2:53:52 } +2024-07-30 03:13:56,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1994/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:56,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66033 samples/s/p 2:53:51 } +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1996/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 9.14863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66207 samples/s/p 2:53:45 } +2024-07-30 03:14:02,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1998/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.1467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:02,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66071 samples/s/p 2:53:45 } +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2000/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.144769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66124 samples/s/p 2:53:41 } +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2002/ 3125], loss: 0.148, per_step_time: 1414ms, lr: 9.1428365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65729 samples/s/p 2:53:46 } +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2004/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.140901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65988 samples/s/p 2:53:38 } +2024-07-30 03:14:13,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2006/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.138963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:13,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.66109 samples/s/p 2:53:33 } +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2008/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 9.137024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65475 samples/s/p 2:53:42 } +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2010/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.135083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65870 samples/s/p 2:53:32 } +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2012/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.1331385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66234 samples/s/p 2:53:22 } +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2014/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 9.131193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65496 samples/s/p 2:53:33 } +2024-07-30 03:14:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2016/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.129246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:27,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65857 samples/s/p 2:53:24 } +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2018/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.127297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:30,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65614 samples/s/p 2:53:25 } +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2020/ 3125], loss: 0.444, per_step_time: 1412ms, lr: 9.125346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66236 samples/s/p 2:53:11 } +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2022/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.123393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65906 samples/s/p 2:53:14 } +2024-07-30 03:14:38,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2024/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.121438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:38,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65665 samples/s/p 2:53:16 } +2024-07-30 03:14:41,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2026/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.119481e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:41,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65759 samples/s/p 2:53:11 } +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2028/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.117522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65863 samples/s/p 2:53:06 } +2024-07-30 03:14:47,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2030/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 9.11556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:47,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66058 samples/s/p 2:53:00 } +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2032/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.113598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65911 samples/s/p 2:53:00 } +2024-07-30 03:14:53,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2034/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.1116335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65847 samples/s/p 2:52:58 } +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2036/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.109666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66045 samples/s/p 2:52:52 } +2024-07-30 03:14:58,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2038/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.107697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:58,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65798 samples/s/p 2:52:54 } +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2040/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 9.105726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65645 samples/s/p 2:52:53 } +2024-07-30 03:15:04,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2042/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.103754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:04,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66127 samples/s/p 2:52:42 } +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2044/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.101778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65958 samples/s/p 2:52:42 } +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2046/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.099802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66166 samples/s/p 2:52:35 } +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2048/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 9.097823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66142 samples/s/p 2:52:33 } +2024-07-30 03:15:15,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2050/ 3125], loss: 0.395, per_step_time: 1412ms, lr: 9.095843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:15,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66175 samples/s/p 2:52:30 } +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2052/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.09386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:18,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.65849 samples/s/p 2:52:33 } +2024-07-30 03:15:21,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2054/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 9.091876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:21,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66154 samples/s/p 2:52:24 } +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2056/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.089889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66023 samples/s/p 2:52:24 } +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2058/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.0879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66113 samples/s/p 2:52:19 } +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2060/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 9.08591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:29,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.65938 samples/s/p 2:52:20 } +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2062/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.0839185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:32,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66137 samples/s/p 2:52:13 } +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2064/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 9.081924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65980 samples/s/p 2:52:13 } +2024-07-30 03:15:38,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2066/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.079927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65815 samples/s/p 2:52:14 } +2024-07-30 03:15:41,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2068/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 9.0779295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:41,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65791 samples/s/p 2:52:11 } +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2070/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.0759295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66142 samples/s/p 2:52:02 } +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 9.073927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65874 samples/s/p 2:52:04 } +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2074/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 9.071923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:49,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65309 samples/s/p 2:52:12 } +2024-07-30 03:15:52,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2076/ 3125], loss: 0.231, per_step_time: 1412ms, lr: 9.069917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:52,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66183 samples/s/p 2:51:53 } +2024-07-30 03:15:55,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2078/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.06791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:55,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66132 samples/s/p 2:51:51 } +2024-07-30 03:15:58,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2080/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:58,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66154 samples/s/p 2:51:48 } +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2082/ 3125], loss: 0.082, per_step_time: 1414ms, lr: 9.063888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65642 samples/s/p 2:51:54 } +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2084/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.061873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66003 samples/s/p 2:51:45 } +2024-07-30 03:16:06,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2086/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.059858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:06,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66018 samples/s/p 2:51:42 } +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2088/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.0578405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65952 samples/s/p 2:51:40 } +2024-07-30 03:16:12,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2090/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0558215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:12,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66049 samples/s/p 2:51:35 } +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2092/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.0538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:15,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65972 samples/s/p 2:51:34 } +2024-07-30 03:16:18,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2094/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 9.051776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:18,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66178 samples/s/p 2:51:27 } +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2096/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.049751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66092 samples/s/p 2:51:26 } +2024-07-30 03:16:23,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2098/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 9.047724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:23,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65554 samples/s/p 2:51:33 } +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2100/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.045693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66163 samples/s/p 2:51:19 } +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2102/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.043662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:29,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66069 samples/s/p 2:51:18 } +2024-07-30 03:16:32,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2104/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 9.04163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:32,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65542 samples/s/p 2:51:25 } +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2106/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.039595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:35,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66139 samples/s/p 2:51:11 } +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2108/ 3125], loss: 0.154, per_step_time: 1414ms, lr: 9.037558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65655 samples/s/p 2:51:17 } +2024-07-30 03:16:40,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2110/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 9.035519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:40,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66263 samples/s/p 2:51:03 } +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2112/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.033478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65847 samples/s/p 2:51:08 } +2024-07-30 03:16:46,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2114/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.031435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:46,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65868 samples/s/p 2:51:05 } +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2116/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 9.029391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66256 samples/s/p 2:50:55 } +2024-07-30 03:16:52,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2118/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.027343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:52,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66183 samples/s/p 2:50:53 } +2024-07-30 03:16:54,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2120/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.025296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66161 samples/s/p 2:50:51 } +2024-07-30 03:16:57,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2122/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.023245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:57,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66119 samples/s/p 2:50:49 } +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2124/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 9.021193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65990 samples/s/p 2:50:48 } +2024-07-30 03:17:03,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2126/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.019139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:03,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66161 samples/s/p 2:50:43 } +2024-07-30 03:17:06,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2128/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.017082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:06,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66034 samples/s/p 2:50:42 } +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2130/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.015024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66192 samples/s/p 2:50:36 } +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2132/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 9.012964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66020 samples/s/p 2:50:37 } +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2134/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 9.010902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65777 samples/s/p 2:50:38 } +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2136/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.008838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66102 samples/s/p 2:50:29 } +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2138/ 3125], loss: 0.397, per_step_time: 1412ms, lr: 9.006773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66179 samples/s/p 2:50:25 } +2024-07-30 03:17:23,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2140/ 3125], loss: 0.387, per_step_time: 1416ms, lr: 9.004705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:23,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.64914 samples/s/p 2:50:45 } +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2142/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.002635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65997 samples/s/p 2:50:23 } +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2144/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 9.000564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.65406 samples/s/p 2:50:31 } +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2146/ 3125], loss: 0.369, per_step_time: 1412ms, lr: 8.998491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66186 samples/s/p 2:50:14 } +2024-07-30 03:17:34,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2148/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 8.996415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:34,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66045 samples/s/p 2:50:14 } +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2150/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 8.994339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66125 samples/s/p 2:50:09 } +2024-07-30 03:17:40,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2152/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.992258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:40,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65960 samples/s/p 2:50:09 } +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2154/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 8.990178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:43,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66191 samples/s/p 2:50:02 } +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2156/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.988095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66013 samples/s/p 2:50:03 } +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2158/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 8.9860105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:48,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65964 samples/s/p 2:50:01 } +2024-07-30 03:17:51,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2160/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 8.983923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:51,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66268 samples/s/p 2:49:53 } +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2162/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.981835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:54,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66007 samples/s/p 2:49:54 } +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2164/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 8.979744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65659 samples/s/p 2:49:58 } +2024-07-30 03:18:00,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2166/ 3125], loss: 0.411, per_step_time: 1412ms, lr: 8.977651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:00,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66176 samples/s/p 2:49:46 } +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2168/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.975558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65932 samples/s/p 2:49:47 } +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2170/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 8.973461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:05,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65918 samples/s/p 2:49:45 } +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2172/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 8.971362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.66082 samples/s/p 2:49:39 } +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2174/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 8.969263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:11,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65873 samples/s/p 2:49:40 } +2024-07-30 03:18:14,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2176/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 8.967161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:14,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65483 samples/s/p 2:49:44 } +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2178/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 8.9650575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65732 samples/s/p 2:49:37 } +2024-07-30 03:18:19,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2180/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 8.962952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65988 samples/s/p 2:49:29 } +2024-07-30 03:18:22,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2182/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 8.960844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:22,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65982 samples/s/p 2:49:27 } +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2184/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.958734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:25,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65820 samples/s/p 2:49:27 } +2024-07-30 03:18:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2186/ 3125], loss: 0.458, per_step_time: 1414ms, lr: 8.956623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65702 samples/s/p 2:49:26 } +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2188/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.954509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65699 samples/s/p 2:49:23 } +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2190/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.952395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:34,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66072 samples/s/p 2:49:14 } +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2192/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 8.950277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66058 samples/s/p 2:49:11 } +2024-07-30 03:18:39,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2194/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 8.948158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:39,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66164 samples/s/p 2:49:06 } +2024-07-30 03:18:42,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2196/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.946038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:42,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65991 samples/s/p 2:49:07 } +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2198/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.943915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65981 samples/s/p 2:49:04 } +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2200/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 8.94179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66191 samples/s/p 2:48:57 } +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2202/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 8.939664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66091 samples/s/p 2:48:56 } +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2204/ 3125], loss: 0.249, per_step_time: 1415ms, lr: 8.937535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.65131 samples/s/p 2:49:11 } +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.935404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66165 samples/s/p 2:48:49 } +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2208/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.9332725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66016 samples/s/p 2:48:49 } +2024-07-30 03:19:02,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2210/ 3125], loss: 0.392, per_step_time: 1412ms, lr: 8.931139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:02,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66407 samples/s/p 2:48:39 } +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2212/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.929003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65947 samples/s/p 2:48:45 } +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2214/ 3125], loss: 0.446, per_step_time: 1416ms, lr: 8.926866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.64950 samples/s/p 2:49:00 } +2024-07-30 03:19:10,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2216/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.924726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:10,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66093 samples/s/p 2:48:37 } +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2218/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.922584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66065 samples/s/p 2:48:34 } +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2220/ 3125], loss: 0.357, per_step_time: 1424ms, lr: 8.92044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.61551 samples/s/p 2:49:53 } +2024-07-30 03:19:19,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2222/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.918296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:19,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.65917 samples/s/p 2:48:31 } +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2224/ 3125], loss: 0.337, per_step_time: 1412ms, lr: 8.916148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66244 samples/s/p 2:48:23 } +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2226/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.913999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66087 samples/s/p 2:48:23 } +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2228/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.911848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:27,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66153 samples/s/p 2:48:19 } +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2230/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.909696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:30,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65976 samples/s/p 2:48:19 } +2024-07-30 03:19:33,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2232/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.907542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:33,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66084 samples/s/p 2:48:14 } +2024-07-30 03:19:36,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2234/ 3125], loss: 0.355, per_step_time: 1415ms, lr: 8.905385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:36,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65033 samples/s/p 2:48:30 } +2024-07-30 03:19:39,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2236/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.903226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:39,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65475 samples/s/p 2:48:19 } +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2238/ 3125], loss: 0.119, per_step_time: 1414ms, lr: 8.901066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65694 samples/s/p 2:48:13 } +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2240/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.8989045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65920 samples/s/p 2:48:06 } +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2242/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.896741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65976 samples/s/p 2:48:02 } +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2244/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.894574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66163 samples/s/p 2:47:56 } +2024-07-30 03:19:53,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2246/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.892407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66049 samples/s/p 2:47:55 } +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2248/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.890238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66017 samples/s/p 2:47:53 } +2024-07-30 03:19:59,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2250/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.888067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:59,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66033 samples/s/p 2:47:50 } +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2252/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.885892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66136 samples/s/p 2:47:45 } +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2254/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.883718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66061 samples/s/p 2:47:43 } +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2256/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.881541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65957 samples/s/p 2:47:42 } +2024-07-30 03:20:10,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2258/ 3125], loss: 0.159, per_step_time: 1416ms, lr: 8.879362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:10,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.64855 samples/s/p 2:47:59 } +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2260/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.877181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66049 samples/s/p 2:47:35 } +2024-07-30 03:20:16,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2262/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.874999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:16,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66020 samples/s/p 2:47:33 } +2024-07-30 03:20:19,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2264/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.872815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65798 samples/s/p 2:47:34 } +2024-07-30 03:20:21,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2266/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.870629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:21,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66019 samples/s/p 2:47:27 } +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2268/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.86844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66036 samples/s/p 2:47:24 } +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2270/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.86625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66124 samples/s/p 2:47:20 } +2024-07-30 03:20:30,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2272/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.864059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:30,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66031 samples/s/p 2:47:19 } +2024-07-30 03:20:33,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2274/ 3125], loss: 0.117, per_step_time: 1412ms, lr: 8.861865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:33,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66172 samples/s/p 2:47:13 } +2024-07-30 03:20:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2276/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.85967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65930 samples/s/p 2:47:15 } +2024-07-30 03:20:38,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2278/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 8.8574725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:38,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65954 samples/s/p 2:47:11 } +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2280/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.855273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:41,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65956 samples/s/p 2:47:09 } +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2282/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 8.853073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66189 samples/s/p 2:47:02 } +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2284/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 8.85087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65591 samples/s/p 2:47:09 } +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2286/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 8.848665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65490 samples/s/p 2:47:08 } +2024-07-30 03:20:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2288/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.8464585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:53,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66167 samples/s/p 2:46:54 } +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2290/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.84425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:55,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66126 samples/s/p 2:46:51 } +2024-07-30 03:20:58,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2292/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 8.842041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:58,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65923 samples/s/p 2:46:52 } +2024-07-30 03:21:01,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2294/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 8.839828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:01,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65863 samples/s/p 2:46:50 } +2024-07-30 03:21:04,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2296/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 8.837615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:04,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65808 samples/s/p 2:46:49 } +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2298/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 8.835399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:07,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65404 samples/s/p 2:46:53 } +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2300/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 8.833182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65396 samples/s/p 2:46:50 } +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2302/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 8.8309625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:12,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65857 samples/s/p 2:46:39 } +2024-07-30 03:21:15,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2304/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.828741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65983 samples/s/p 2:46:34 } +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2306/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 8.826519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:18,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65810 samples/s/p 2:46:34 } +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2308/ 3125], loss: 0.211, per_step_time: 1415ms, lr: 8.824293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:21,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65304 samples/s/p 2:46:40 } +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2310/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 8.822068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.66240 samples/s/p 2:46:21 } +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2312/ 3125], loss: 0.224, per_step_time: 1416ms, lr: 8.8198385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.64968 samples/s/p 2:46:41 } +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2314/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 8.817608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66149 samples/s/p 2:46:17 } +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2316/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 8.8153765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:32,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66286 samples/s/p 2:46:12 } +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2318/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 8.813143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:35,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.65951 samples/s/p 2:46:15 } +2024-07-30 03:21:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2320/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.810907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:38,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66288 samples/s/p 2:46:06 } +2024-07-30 03:21:41,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2322/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 8.808669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66148 samples/s/p 2:46:06 } +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2324/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.80643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:44,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66051 samples/s/p 2:46:05 } +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2326/ 3125], loss: 0.665, per_step_time: 1413ms, lr: 8.804189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66072 samples/s/p 2:46:01 } +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2328/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.801945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66021 samples/s/p 2:46:00 } +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2330/ 3125], loss: 0.517, per_step_time: 1413ms, lr: 8.7997005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65955 samples/s/p 2:45:58 } +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2332/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.797455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65937 samples/s/p 2:45:55 } +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2334/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 8.795207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:58,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66021 samples/s/p 2:45:51 } +2024-07-30 03:22:01,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2336/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 8.792956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:01,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66201 samples/s/p 2:45:45 } +2024-07-30 03:22:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2338/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.790704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:03,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65924 samples/s/p 2:45:47 } +2024-07-30 03:22:06,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2340/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 8.788449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:06,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66143 samples/s/p 2:45:40 } +2024-07-30 03:22:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2342/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 8.7861945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66162 samples/s/p 2:45:37 } +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2344/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 8.783937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66219 samples/s/p 2:45:33 } +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2346/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.781677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:15,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66099 samples/s/p 2:45:33 } +2024-07-30 03:22:18,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2348/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 8.779416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:18,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.65871 samples/s/p 2:45:34 } +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2350/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 8.777153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65991 samples/s/p 2:45:29 } +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2352/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.774889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.66196 samples/s/p 2:45:23 } +2024-07-30 03:22:26,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2354/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.772622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65814 samples/s/p 2:45:26 } +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2356/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.770355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65720 samples/s/p 2:45:25 } +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2358/ 3125], loss: 0.312, per_step_time: 1415ms, lr: 8.768084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65301 samples/s/p 2:45:30 } +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2360/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 8.765812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66168 samples/s/p 2:45:12 } +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2362/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.763538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:37,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65849 samples/s/p 2:45:15 } +2024-07-30 03:22:40,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2364/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 8.7612625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:40,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.63795 samples/s/p 2:45:48 } +2024-07-30 03:22:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2366/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 8.758985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66096 samples/s/p 2:45:05 } +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2368/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.756707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65882 samples/s/p 2:45:05 } +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2370/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 8.754426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65952 samples/s/p 2:45:01 } +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2372/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.752143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:52,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65525 samples/s/p 2:45:06 } +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2374/ 3125], loss: 0.473, per_step_time: 1412ms, lr: 8.749858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:54,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.66192 samples/s/p 2:44:52 } +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2376/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.747572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.66051 samples/s/p 2:44:51 } +2024-07-30 03:23:00,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2378/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 8.745284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:00,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65846 samples/s/p 2:44:52 } +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2380/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.7429935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65824 samples/s/p 2:44:50 } +2024-07-30 03:23:06,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2382/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 8.7407025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:06,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66266 samples/s/p 2:44:39 } +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2384/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.738409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66030 samples/s/p 2:44:40 } +2024-07-30 03:23:11,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2386/ 3125], loss: 0.167, per_step_time: 1412ms, lr: 8.736114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:11,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66255 samples/s/p 2:44:33 } +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2388/ 3125], loss: 0.389, per_step_time: 1412ms, lr: 8.733817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66223 samples/s/p 2:44:31 } +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2390/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 8.731518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66122 samples/s/p 2:44:30 } +2024-07-30 03:23:20,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2392/ 3125], loss: 0.226, per_step_time: 1412ms, lr: 8.729217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:20,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66244 samples/s/p 2:44:25 } +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2394/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 8.726915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:23,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.65990 samples/s/p 2:44:27 } +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2396/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.724612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66017 samples/s/p 2:44:24 } +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2398/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 8.722305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66025 samples/s/p 2:44:21 } +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2400/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.719997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65928 samples/s/p 2:44:19 } +2024-07-30 03:23:34,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2402/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.717688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:34,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65962 samples/s/p 2:44:16 } +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2404/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.715378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:37,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66023 samples/s/p 2:44:12 } +2024-07-30 03:23:40,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2406/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 8.713065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:40,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66089 samples/s/p 2:44:08 } +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2408/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 8.710749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.65145 samples/s/p 2:44:22 } +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2410/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 8.708433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66203 samples/s/p 2:44:00 } +2024-07-30 03:23:48,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2412/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.706115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:48,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66147 samples/s/p 2:43:59 } +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2414/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.703795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:51,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66129 samples/s/p 2:43:56 } +2024-07-30 03:23:54,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2416/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.701472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:54,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66159 samples/s/p 2:43:53 } +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2418/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.699149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66061 samples/s/p 2:43:52 } +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2420/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 8.696824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66143 samples/s/p 2:43:47 } +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2422/ 3125], loss: 0.210, per_step_time: 1415ms, lr: 8.694497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65293 samples/s/p 2:43:59 } +2024-07-30 03:24:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2424/ 3125], loss: 0.583, per_step_time: 1413ms, lr: 8.692168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:05,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65911 samples/s/p 2:43:46 } +2024-07-30 03:24:08,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2426/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.689837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:08,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65949 samples/s/p 2:43:42 } +2024-07-30 03:24:11,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2428/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 8.687505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:11,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66125 samples/s/p 2:43:36 } +2024-07-30 03:24:14,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2430/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 8.6851705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:14,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66152 samples/s/p 2:43:33 } +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2432/ 3125], loss: 0.409, per_step_time: 1415ms, lr: 8.682835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65330 samples/s/p 2:43:45 } +2024-07-30 03:24:19,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2434/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 8.680497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:19,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.66207 samples/s/p 2:43:27 } +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2436/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 8.678157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.65865 samples/s/p 2:43:30 } +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2438/ 3125], loss: 0.460, per_step_time: 1414ms, lr: 8.675816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65538 samples/s/p 2:43:32 } +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2440/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 8.6734735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65978 samples/s/p 2:43:22 } +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2442/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 8.671129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65722 samples/s/p 2:43:24 } +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2444/ 3125], loss: 0.472, per_step_time: 1413ms, lr: 8.668782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66134 samples/s/p 2:43:14 } +2024-07-30 03:24:36,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2446/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.666434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65869 samples/s/p 2:43:15 } +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2448/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 8.664085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66044 samples/s/p 2:43:10 } +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2450/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.661733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:42,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65942 samples/s/p 2:43:08 } +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2452/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.659379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66048 samples/s/p 2:43:04 } +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2454/ 3125], loss: 0.155, per_step_time: 1414ms, lr: 8.6570235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:48,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65564 samples/s/p 2:43:09 } +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2456/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 8.654667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66196 samples/s/p 2:42:56 } +2024-07-30 03:24:53,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2458/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.652309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65833 samples/s/p 2:42:59 } +2024-07-30 03:24:56,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2460/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 8.649948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:56,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66067 samples/s/p 2:42:52 } +2024-07-30 03:24:59,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2462/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.647586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:59,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66103 samples/s/p 2:42:49 } +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2464/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.645222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66087 samples/s/p 2:42:46 } +2024-07-30 03:25:05,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2466/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 8.642855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:05,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66256 samples/s/p 2:42:40 } +2024-07-30 03:25:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2468/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.640488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65960 samples/s/p 2:42:43 } +2024-07-30 03:25:10,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2470/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 8.638119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:10,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65797 samples/s/p 2:42:43 } +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2472/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 8.635749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65561 samples/s/p 2:42:44 } +2024-07-30 03:25:16,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2474/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.633376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65899 samples/s/p 2:42:35 } +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2476/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 8.631002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65607 samples/s/p 2:42:38 } +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2478/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.628625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65608 samples/s/p 2:42:35 } +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2480/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.626247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66067 samples/s/p 2:42:24 } +2024-07-30 03:25:27,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2482/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 8.623868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:27,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66045 samples/s/p 2:42:21 } +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2484/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 8.621487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66213 samples/s/p 2:42:16 } +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2486/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 8.619103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66180 samples/s/p 2:42:14 } +2024-07-30 03:25:36,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2488/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.616719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:36,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65951 samples/s/p 2:42:15 } +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2490/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.614333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65929 samples/s/p 2:42:12 } +2024-07-30 03:25:42,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2492/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 8.611944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:42,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65821 samples/s/p 2:42:11 } +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2494/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:44,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65971 samples/s/p 2:42:06 } +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2496/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 8.607162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:47,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65919 samples/s/p 2:42:04 } +2024-07-30 03:25:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2498/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.6047685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.66195 samples/s/p 2:41:56 } +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2500/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.602375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:53,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65995 samples/s/p 2:41:57 } +2024-07-30 03:25:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2502/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 8.599976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:56,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65705 samples/s/p 2:41:59 } +2024-07-30 03:25:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2504/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 8.597579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65814 samples/s/p 2:41:54 } +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2506/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.595178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:01,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65980 samples/s/p 2:41:49 } +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2508/ 3125], loss: 0.387, per_step_time: 1412ms, lr: 8.592777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66225 samples/s/p 2:41:42 } +2024-07-30 03:26:07,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2510/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 8.590373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66175 samples/s/p 2:41:40 } +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2512/ 3125], loss: 0.230, per_step_time: 1416ms, lr: 8.587968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.64853 samples/s/p 2:42:00 } +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2514/ 3125], loss: 0.258, per_step_time: 1414ms, lr: 8.58556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.65388 samples/s/p 2:41:48 } +2024-07-30 03:26:16,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2516/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 8.5831525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:16,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66019 samples/s/p 2:41:34 } +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2518/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.580741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65697 samples/s/p 2:41:37 } +2024-07-30 03:26:21,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2520/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.578329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66016 samples/s/p 2:41:28 } +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2522/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.575915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65997 samples/s/p 2:41:26 } +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2524/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.573499e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65866 samples/s/p 2:41:25 } +2024-07-30 03:26:30,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2526/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 8.571082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66176 samples/s/p 2:41:17 } +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2528/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 8.568663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65684 samples/s/p 2:41:23 } +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2530/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.566242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65891 samples/s/p 2:41:16 } +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2532/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 8.563819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.66036 samples/s/p 2:41:11 } +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2534/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.561396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.66086 samples/s/p 2:41:07 } +2024-07-30 03:26:44,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2536/ 3125], loss: 0.029, per_step_time: 1412ms, lr: 8.55897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66200 samples/s/p 2:41:03 } +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2538/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 8.556542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:47,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.65977 samples/s/p 2:41:03 } +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2540/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 8.554112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66106 samples/s/p 2:40:58 } +2024-07-30 03:26:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2542/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.551682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:52,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66009 samples/s/p 2:40:57 } +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2544/ 3125], loss: 0.513, per_step_time: 1412ms, lr: 8.549249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66238 samples/s/p 2:40:51 } +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2546/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 8.546815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66070 samples/s/p 2:40:51 } +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2548/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 8.544379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66140 samples/s/p 2:40:47 } +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2550/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 8.541941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65911 samples/s/p 2:40:48 } +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2552/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.539501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:07,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66044 samples/s/p 2:40:43 } +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2554/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 8.537061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66198 samples/s/p 2:40:37 } +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2556/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 8.534618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65494 samples/s/p 2:40:46 } +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2558/ 3125], loss: 0.511, per_step_time: 1414ms, lr: 8.532173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65625 samples/s/p 2:40:41 } +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2560/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 8.529727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:18,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65671 samples/s/p 2:40:38 } +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2562/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 8.5272795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65980 samples/s/p 2:40:30 } +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2564/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.52483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65987 samples/s/p 2:40:27 } +2024-07-30 03:27:26,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2566/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 8.522378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:26,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65845 samples/s/p 2:40:26 } +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2568/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.519925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66148 samples/s/p 2:40:18 } +2024-07-30 03:27:32,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2570/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.517471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:32,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66061 samples/s/p 2:40:17 } +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2572/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 8.515014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66001 samples/s/p 2:40:15 } +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2574/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.512557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65919 samples/s/p 2:40:14 } +2024-07-30 03:27:41,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2576/ 3125], loss: 0.606, per_step_time: 1414ms, lr: 8.510097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:41,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65544 samples/s/p 2:40:17 } +2024-07-30 03:27:43,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2578/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.507635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:44,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65912 samples/s/p 2:40:08 } +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2580/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 8.505172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66138 samples/s/p 2:40:01 } +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2582/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.502709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66084 samples/s/p 2:39:59 } +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2584/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 8.500242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65966 samples/s/p 2:39:59 } +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2586/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 8.497773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:55,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65679 samples/s/p 2:40:01 } +2024-07-30 03:27:58,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2588/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.495304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:58,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66124 samples/s/p 2:39:50 } +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2590/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 8.492833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65887 samples/s/p 2:39:52 } +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2592/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.4903595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66146 samples/s/p 2:39:44 } +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2594/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.487885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65996 samples/s/p 2:39:44 } +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2596/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.485409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66284 samples/s/p 2:39:36 } +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2598/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.482931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66086 samples/s/p 2:39:37 } +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2600/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.480451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65979 samples/s/p 2:39:36 } +2024-07-30 03:28:18,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2602/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 8.477969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:18,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65625 samples/s/p 2:39:39 } +2024-07-30 03:28:20,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2604/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.4754865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:20,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66128 samples/s/p 2:39:28 } +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2606/ 3125], loss: 0.323, per_step_time: 1424ms, lr: 8.473002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:23,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.61419 samples/s/p 2:40:45 } +2024-07-30 03:28:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2608/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 8.470515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66113 samples/s/p 2:39:22 } +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2610/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 8.468027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:29,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66237 samples/s/p 2:39:17 } +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2612/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 8.465538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65934 samples/s/p 2:39:20 } +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2614/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 8.4630465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65721 samples/s/p 2:39:20 } +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2616/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.4605535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65850 samples/s/p 2:39:15 } +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2618/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.45806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.66103 samples/s/p 2:39:08 } +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2620/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.455562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65809 samples/s/p 2:39:10 } +2024-07-30 03:28:46,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2622/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.453065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:46,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.65824 samples/s/p 2:39:07 } +2024-07-30 03:28:49,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2624/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.4505655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:49,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.66038 samples/s/p 2:39:01 } +2024-07-30 03:28:52,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2626/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.448064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:52,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.66105 samples/s/p 2:38:57 } +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2628/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 8.445561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:54,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.65619 samples/s/p 2:39:02 } +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2630/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 8.443058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66188 samples/s/p 2:38:50 } +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2632/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.440551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65435 samples/s/p 2:39:00 } +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2634/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.438044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:03,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65980 samples/s/p 2:38:48 } +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2636/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 8.435534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66305 samples/s/p 2:38:39 } +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2638/ 3125], loss: 0.058, per_step_time: 1415ms, lr: 8.433022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65162 samples/s/p 2:38:56 } +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2640/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 8.43051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66359 samples/s/p 2:38:33 } +2024-07-30 03:29:14,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2642/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 8.427995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:14,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66002 samples/s/p 2:38:36 } +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2644/ 3125], loss: 0.282, per_step_time: 1416ms, lr: 8.425479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.64697 samples/s/p 2:38:55 } +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2646/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 8.422962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:20,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65943 samples/s/p 2:38:31 } +2024-07-30 03:29:23,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2648/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.420443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:23,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65921 samples/s/p 2:38:29 } +2024-07-30 03:29:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2650/ 3125], loss: 0.492, per_step_time: 1413ms, lr: 8.417922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65990 samples/s/p 2:38:25 } +2024-07-30 03:29:28,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2652/ 3125], loss: 0.169, per_step_time: 1416ms, lr: 8.4154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:28,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.64733 samples/s/p 2:38:43 } +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2654/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.412875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65889 samples/s/p 2:38:21 } +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2656/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 8.410349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.66156 samples/s/p 2:38:14 } +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2658/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 8.407823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66010 samples/s/p 2:38:13 } +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2660/ 3125], loss: 0.666, per_step_time: 1413ms, lr: 8.405293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:40,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66096 samples/s/p 2:38:09 } +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2662/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 8.402762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:43,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65908 samples/s/p 2:38:09 } +2024-07-30 03:29:45,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2664/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 8.40023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65882 samples/s/p 2:38:07 } +2024-07-30 03:29:48,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2666/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.397697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65776 samples/s/p 2:38:06 } +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2668/ 3125], loss: 0.216, per_step_time: 1414ms, lr: 8.395162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65538 samples/s/p 2:38:07 } +2024-07-30 03:29:54,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2670/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 8.392624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:54,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65748 samples/s/p 2:38:01 } +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2672/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 8.390086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:57,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66068 samples/s/p 2:37:53 } +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2674/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 8.387545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:00,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66176 samples/s/p 2:37:48 } +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2676/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.385003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:02,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66149 samples/s/p 2:37:46 } +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2678/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 8.38246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.65727 samples/s/p 2:37:50 } +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2680/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 8.379913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:08,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66236 samples/s/p 2:37:38 } +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2682/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 8.377367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:11,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66128 samples/s/p 2:37:37 } +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2684/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.374818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66044 samples/s/p 2:37:36 } +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2686/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 8.372269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:17,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66180 samples/s/p 2:37:31 } +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2688/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 8.369716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66074 samples/s/p 2:37:30 } +2024-07-30 03:30:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2690/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.367164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:22,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65794 samples/s/p 2:37:32 } +2024-07-30 03:30:25,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2692/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.364609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:25,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65987 samples/s/p 2:37:26 } +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2694/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.3620525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66008 samples/s/p 2:37:22 } +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2696/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 8.359494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66077 samples/s/p 2:37:19 } +2024-07-30 03:30:34,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2698/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 8.356935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:34,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65885 samples/s/p 2:37:19 } +2024-07-30 03:30:36,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2700/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 8.354374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66058 samples/s/p 2:37:13 } +2024-07-30 03:30:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2702/ 3125], loss: 0.419, per_step_time: 1414ms, lr: 8.351811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65737 samples/s/p 2:37:16 } +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2704/ 3125], loss: 0.374, per_step_time: 1412ms, lr: 8.349247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66209 samples/s/p 2:37:05 } +2024-07-30 03:30:45,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2706/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 8.34668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:45,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66190 samples/s/p 2:37:02 } +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2708/ 3125], loss: 0.245, per_step_time: 1418ms, lr: 8.344113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.63962 samples/s/p 2:37:37 } +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2710/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.3415425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65919 samples/s/p 2:37:01 } +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2712/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 8.338972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65911 samples/s/p 2:36:59 } +2024-07-30 03:30:56,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2714/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 8.336399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:56,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65993 samples/s/p 2:36:54 } +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2716/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 8.3338255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65585 samples/s/p 2:36:58 } +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2718/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.33125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:02,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65645 samples/s/p 2:36:55 } +2024-07-30 03:31:05,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2720/ 3125], loss: 0.154, per_step_time: 1415ms, lr: 8.328672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:05,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65179 samples/s/p 2:37:00 } +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2722/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 8.326094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.66051 samples/s/p 2:36:42 } +2024-07-30 03:31:10,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2724/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.323513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:10,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66141 samples/s/p 2:36:38 } +2024-07-30 03:31:13,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2726/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 8.320931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:13,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66286 samples/s/p 2:36:33 } +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2728/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.318348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66070 samples/s/p 2:36:33 } +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2730/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.315763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:19,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66086 samples/s/p 2:36:30 } +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2732/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.313175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66105 samples/s/p 2:36:27 } +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2734/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.310587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66251 samples/s/p 2:36:22 } +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2736/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.307998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65997 samples/s/p 2:36:23 } +2024-07-30 03:31:30,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2738/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 8.3054065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:30,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65818 samples/s/p 2:36:23 } +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2740/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 8.3028135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.64691 samples/s/p 2:36:39 } +2024-07-30 03:31:36,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2742/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.300218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:36,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66013 samples/s/p 2:36:15 } +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2744/ 3125], loss: 0.310, per_step_time: 1416ms, lr: 8.297622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:39,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.64643 samples/s/p 2:36:34 } +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2746/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.295025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:42,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65926 samples/s/p 2:36:10 } +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2748/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.292424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65982 samples/s/p 2:36:07 } +2024-07-30 03:31:47,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2750/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 8.289823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:47,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65647 samples/s/p 2:36:09 } +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2752/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.287221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65899 samples/s/p 2:36:02 } +2024-07-30 03:31:53,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2754/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.284617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:53,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65984 samples/s/p 2:35:58 } +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2756/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.282012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:56,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66005 samples/s/p 2:35:55 } +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2758/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 8.279404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66010 samples/s/p 2:35:52 } +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2760/ 3125], loss: 0.341, per_step_time: 1412ms, lr: 8.276795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66359 samples/s/p 2:35:43 } +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2762/ 3125], loss: 0.064, per_step_time: 1413ms, lr: 8.274184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66121 samples/s/p 2:35:44 } +2024-07-30 03:32:07,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2764/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 8.271573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:07,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66044 samples/s/p 2:35:43 } +2024-07-30 03:32:10,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2766/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.26896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:10,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66104 samples/s/p 2:35:39 } +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2768/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.266344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65477 samples/s/p 2:35:47 } +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2770/ 3125], loss: 0.292, per_step_time: 1417ms, lr: 8.263728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.64535 samples/s/p 2:35:59 } +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2772/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.2611095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65834 samples/s/p 2:35:35 } +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2774/ 3125], loss: 0.234, per_step_time: 1416ms, lr: 8.25849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.64729 samples/s/p 2:35:51 } +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2776/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 8.255868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65908 samples/s/p 2:35:28 } +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2778/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.253245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.66021 samples/s/p 2:35:24 } +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2780/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 8.250621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66120 samples/s/p 2:35:19 } +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2782/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 8.2479955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66014 samples/s/p 2:35:18 } +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2784/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 8.245368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:35,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66072 samples/s/p 2:35:14 } +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2786/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.242739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66015 samples/s/p 2:35:12 } +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2788/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 8.240108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65905 samples/s/p 2:35:11 } +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2790/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 8.237476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66233 samples/s/p 2:35:03 } +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2792/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 8.234842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65539 samples/s/p 2:35:12 } +2024-07-30 03:32:50,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2794/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 8.2322085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65879 samples/s/p 2:35:03 } +2024-07-30 03:32:52,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2796/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 8.22957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:52,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66358 samples/s/p 2:34:53 } +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2798/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 8.226932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66066 samples/s/p 2:34:55 } +2024-07-30 03:32:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2800/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.224293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65824 samples/s/p 2:34:56 } +2024-07-30 03:32:58,651 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2802/ 3125], loss: 0.252, per_step_time: 2195ms, lr: 8.221651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 3.64457 samples/s/p 4:00:28 } +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2804/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.219007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65897 samples/s/p 2:34:49 } +2024-07-30 03:33:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2806/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.216363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:39,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.66098 samples/s/p 2:34:43 } +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2808/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.213718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65911 samples/s/p 2:34:43 } +2024-07-30 03:33:44,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2810/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 8.211069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:44,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.66028 samples/s/p 2:34:38 } +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2812/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.208421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:47,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65777 samples/s/p 2:34:39 } +2024-07-30 03:33:50,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2814/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 8.20577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:50,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.66109 samples/s/p 2:34:31 } +2024-07-30 03:33:53,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2816/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 8.203118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.65724 samples/s/p 2:34:35 } +2024-07-30 03:33:56,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2818/ 3125], loss: 0.163, per_step_time: 1416ms, lr: 8.200464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:56,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.64714 samples/s/p 2:34:48 } +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2820/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.19781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66275 samples/s/p 2:34:20 } +2024-07-30 03:34:02,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2822/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 8.195152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:02,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66091 samples/s/p 2:34:20 } +2024-07-30 03:34:04,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2824/ 3125], loss: 0.480, per_step_time: 1412ms, lr: 8.1924945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:04,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66299 samples/s/p 2:34:14 } +2024-07-30 03:34:07,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2826/ 3125], loss: 0.451, per_step_time: 1421ms, lr: 8.189835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:07,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.62823 samples/s/p 2:35:08 } +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2828/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 8.187173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65829 samples/s/p 2:34:16 } +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2830/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.184512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.66009 samples/s/p 2:34:10 } +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2832/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.181846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65890 samples/s/p 2:34:09 } +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2834/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 8.17918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:19,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65294 samples/s/p 2:34:16 } +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2836/ 3125], loss: 0.293, per_step_time: 1412ms, lr: 8.176514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66231 samples/s/p 2:33:58 } +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2838/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 8.1738435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:24,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65928 samples/s/p 2:34:00 } +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2840/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.171173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65994 samples/s/p 2:33:56 } +2024-07-30 03:34:30,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2842/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.168502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:30,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65854 samples/s/p 2:33:56 } +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2844/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 8.165828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66159 samples/s/p 2:33:48 } +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2846/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 8.163152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:36,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65455 samples/s/p 2:33:57 } +2024-07-30 03:34:38,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2848/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 8.160477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:38,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65926 samples/s/p 2:33:46 } +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2850/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.157799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65921 samples/s/p 2:33:43 } +2024-07-30 03:34:44,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2852/ 3125], loss: 0.294, per_step_time: 1425ms, lr: 8.155119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:44,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.61260 samples/s/p 2:34:57 } +2024-07-30 03:34:47,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2854/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.152439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:47,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.66092 samples/s/p 2:33:35 } +2024-07-30 03:34:50,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2856/ 3125], loss: 0.288, per_step_time: 1412ms, lr: 8.149756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66191 samples/s/p 2:33:31 } +2024-07-30 03:34:53,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2858/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.147072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:53,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66097 samples/s/p 2:33:29 } +2024-07-30 03:34:55,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2860/ 3125], loss: 0.232, per_step_time: 1415ms, lr: 8.144387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:55,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65200 samples/s/p 2:33:41 } +2024-07-30 03:34:58,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2862/ 3125], loss: 0.199, per_step_time: 1415ms, lr: 8.1417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:58,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65114 samples/s/p 2:33:40 } +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2864/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.139012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66062 samples/s/p 2:33:21 } +2024-07-30 03:35:04,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2866/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 8.1363205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:04,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.65465 samples/s/p 2:33:28 } +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2868/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 8.133629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:07,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66043 samples/s/p 2:33:16 } +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2870/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.130936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66033 samples/s/p 2:33:13 } +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2872/ 3125], loss: 0.205, per_step_time: 1693ms, lr: 8.1282415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:13,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 4.72459 samples/s/p 3:03:31 } +2024-07-30 03:35:16,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2874/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.125546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65960 samples/s/p 2:33:09 } +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2876/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 8.122848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65887 samples/s/p 2:33:07 } +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2878/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.12015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66072 samples/s/p 2:33:01 } +2024-07-30 03:35:24,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2880/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.117449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:24,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66060 samples/s/p 2:32:59 } +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2882/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 8.114746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65720 samples/s/p 2:33:01 } +2024-07-30 03:35:30,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2884/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.112043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.66126 samples/s/p 2:32:52 } +2024-07-30 03:35:33,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2886/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 8.109339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:33,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65084 samples/s/p 2:33:06 } +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2888/ 3125], loss: 0.190, per_step_time: 1416ms, lr: 8.106633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.64655 samples/s/p 2:33:10 } +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2890/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.103924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65943 samples/s/p 2:32:47 } +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2892/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 8.101215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65699 samples/s/p 2:32:48 } +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2894/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.098505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65990 samples/s/p 2:32:40 } +2024-07-30 03:35:47,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2896/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 8.0957925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:47,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65800 samples/s/p 2:32:40 } +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2898/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 8.0930795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:50,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65834 samples/s/p 2:32:37 } +2024-07-30 03:35:53,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2900/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.090362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:53,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66142 samples/s/p 2:32:29 } +2024-07-30 03:35:55,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2902/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.087645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:55,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65477 samples/s/p 2:32:37 } +2024-07-30 03:35:58,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2904/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 8.084929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:58,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65202 samples/s/p 2:32:39 } +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2906/ 3125], loss: 0.262, per_step_time: 1412ms, lr: 8.082207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66211 samples/s/p 2:32:20 } +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2908/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.079487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65875 samples/s/p 2:32:22 } +2024-07-30 03:36:07,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2910/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.076764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:07,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65885 samples/s/p 2:32:19 } +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2912/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 8.07404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:10,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66013 samples/s/p 2:32:14 } +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2914/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.071315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:13,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65939 samples/s/p 2:32:13 } +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2916/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 8.068589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66051 samples/s/p 2:32:08 } +2024-07-30 03:36:18,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2918/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 8.065859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:18,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65774 samples/s/p 2:32:10 } +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2920/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.063129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66141 samples/s/p 2:32:01 } +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2922/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.060398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66043 samples/s/p 2:32:00 } +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2924/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.057666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:27,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65573 samples/s/p 2:32:04 } +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2926/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.05493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66093 samples/s/p 2:31:53 } +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2928/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 8.052194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65755 samples/s/p 2:31:56 } +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2930/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 8.049457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65833 samples/s/p 2:31:52 } +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2932/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.046719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:38,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65955 samples/s/p 2:31:47 } +2024-07-30 03:36:41,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2934/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 8.043978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:41,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66126 samples/s/p 2:31:41 } +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2936/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 8.0412365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66132 samples/s/p 2:31:38 } +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2938/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.038493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65987 samples/s/p 2:31:38 } +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2940/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.035749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:49,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65451 samples/s/p 2:31:44 } +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2942/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 8.033003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66052 samples/s/p 2:31:31 } +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2944/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.030256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66006 samples/s/p 2:31:29 } +2024-07-30 03:36:58,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2946/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 8.027507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:58,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65950 samples/s/p 2:31:27 } +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2948/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.024756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:01,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65994 samples/s/p 2:31:24 } +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2950/ 3125], loss: 0.508, per_step_time: 1414ms, lr: 8.022005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:04,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65731 samples/s/p 2:31:25 } +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2952/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 8.019252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65208 samples/s/p 2:31:31 } +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2954/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.016496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66030 samples/s/p 2:31:15 } +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2956/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.013741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:12,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66131 samples/s/p 2:31:10 } +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2958/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.010983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:15,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65953 samples/s/p 2:31:10 } +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2960/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 8.008224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.66040 samples/s/p 2:31:06 } +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2962/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.005464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65894 samples/s/p 2:31:06 } +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2964/ 3125], loss: 0.201, per_step_time: 1415ms, lr: 8.002702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:23,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65344 samples/s/p 2:31:11 } +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2966/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 7.999938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:26,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65957 samples/s/p 2:30:59 } +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2968/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.997174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65996 samples/s/p 2:30:55 } +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2970/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 7.9944075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:32,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65528 samples/s/p 2:31:00 } +2024-07-30 03:37:35,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2972/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 7.991641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:35,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65770 samples/s/p 2:30:53 } +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2974/ 3125], loss: 0.402, per_step_time: 1415ms, lr: 7.988871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65228 samples/s/p 2:30:59 } +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2976/ 3125], loss: 0.045, per_step_time: 1412ms, lr: 7.986101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.66192 samples/s/p 2:30:41 } +2024-07-30 03:37:43,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2978/ 3125], loss: 0.486, per_step_time: 1413ms, lr: 7.983329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:43,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65840 samples/s/p 2:30:44 } +2024-07-30 03:37:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2980/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.980555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:46,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66009 samples/s/p 2:30:38 } +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2982/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.977781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66047 samples/s/p 2:30:35 } +2024-07-30 03:37:52,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2984/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 7.975005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:52,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65986 samples/s/p 2:30:33 } +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2986/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 7.972229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66132 samples/s/p 2:30:28 } +2024-07-30 03:37:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2988/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.969448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65953 samples/s/p 2:30:28 } +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2990/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.966668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66102 samples/s/p 2:30:23 } +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2992/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 7.963886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65364 samples/s/p 2:30:32 } +2024-07-30 03:38:06,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2994/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 7.961103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:06,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65686 samples/s/p 2:30:24 } +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2996/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 7.958318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.65739 samples/s/p 2:30:20 } +2024-07-30 03:38:12,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2998/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 7.955532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:12,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.66054 samples/s/p 2:30:12 } +2024-07-30 03:38:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3000/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.952744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65971 samples/s/p 2:30:11 } +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3002/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 7.949957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65998 samples/s/p 2:30:07 } +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3004/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 7.9471665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.66008 samples/s/p 2:30:04 } +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3006/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.9443735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66133 samples/s/p 2:30:00 } +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3008/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 7.94158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65964 samples/s/p 2:29:59 } +2024-07-30 03:38:29,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3010/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 7.938786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:29,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66015 samples/s/p 2:29:56 } +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3012/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.93599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66097 samples/s/p 2:29:52 } +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3014/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 7.933193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:34,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65907 samples/s/p 2:29:52 } +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3016/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 7.9303945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.66122 samples/s/p 2:29:46 } +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3018/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 7.927595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.66052 samples/s/p 2:29:44 } +2024-07-30 03:38:43,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3020/ 3125], loss: 0.311, per_step_time: 1415ms, lr: 7.924794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:43,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65194 samples/s/p 2:29:55 } +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3022/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.92199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:46,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65971 samples/s/p 2:29:39 } +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3024/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.919186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65998 samples/s/p 2:29:36 } +2024-07-30 03:38:51,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3026/ 3125], loss: 0.484, per_step_time: 1414ms, lr: 7.91638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:51,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65661 samples/s/p 2:29:39 } +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3028/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 7.9135725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:54,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65572 samples/s/p 2:29:37 } +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3030/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.910764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:57,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65714 samples/s/p 2:29:32 } +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3032/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 7.907955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65772 samples/s/p 2:29:28 } +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3034/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 7.905143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:03,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65425 samples/s/p 2:29:31 } +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3036/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 7.902331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66207 samples/s/p 2:29:16 } +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3038/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.899518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:08,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66110 samples/s/p 2:29:15 } +2024-07-30 03:39:11,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3040/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.896702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:11,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66366 samples/s/p 2:29:08 } +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3042/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.893886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:14,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65845 samples/s/p 2:29:13 } +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3044/ 3125], loss: 0.133, per_step_time: 1412ms, lr: 7.891067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66214 samples/s/p 2:29:05 } +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3046/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 7.888248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.65978 samples/s/p 2:29:05 } +2024-07-30 03:39:22,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3048/ 3125], loss: 0.188, per_step_time: 1412ms, lr: 7.885426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:22,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66228 samples/s/p 2:28:59 } +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3050/ 3125], loss: 0.253, per_step_time: 1412ms, lr: 7.882604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66173 samples/s/p 2:28:57 } +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3052/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 7.87978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66193 samples/s/p 2:28:54 } +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3054/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.876955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66042 samples/s/p 2:28:53 } +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3056/ 3125], loss: 0.063, per_step_time: 1412ms, lr: 7.874129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66181 samples/s/p 2:28:48 } +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3058/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 7.871301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.65697 samples/s/p 2:28:53 } +2024-07-30 03:39:39,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3060/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 7.8684725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:39,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66294 samples/s/p 2:28:41 } +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3062/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.865641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:42,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65987 samples/s/p 2:28:43 } +2024-07-30 03:39:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3064/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.862808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:45,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65932 samples/s/p 2:28:41 } +2024-07-30 03:39:48,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3066/ 3125], loss: 0.247, per_step_time: 1412ms, lr: 7.859976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:48,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66330 samples/s/p 2:28:32 } +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3068/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 7.857141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:51,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65920 samples/s/p 2:28:35 } +2024-07-30 03:39:54,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3070/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 7.854305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65256 samples/s/p 2:28:43 } +2024-07-30 03:39:56,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3072/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 7.851468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:56,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.66046 samples/s/p 2:28:28 } +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3074/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.84863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:59,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65943 samples/s/p 2:28:26 } +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3076/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.845789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.66146 samples/s/p 2:28:20 } +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3078/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.842948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65944 samples/s/p 2:28:21 } +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3080/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.840105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65906 samples/s/p 2:28:19 } +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3082/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 7.8372605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65575 samples/s/p 2:28:21 } +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3084/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 7.834416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65795 samples/s/p 2:28:15 } +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3086/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.831569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66106 samples/s/p 2:28:07 } +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3088/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 7.82872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66205 samples/s/p 2:28:03 } +2024-07-30 03:40:22,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3090/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.825871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:22,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66035 samples/s/p 2:28:02 } +2024-07-30 03:40:25,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3092/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.82302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:25,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65943 samples/s/p 2:28:01 } +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3094/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.820167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65904 samples/s/p 2:27:59 } +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3096/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 7.817314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65927 samples/s/p 2:27:56 } +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3098/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.814459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65904 samples/s/p 2:27:53 } +2024-07-30 03:40:36,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3100/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 7.811602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66065 samples/s/p 2:27:48 } +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3102/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 7.808745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65750 samples/s/p 2:27:50 } +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3104/ 3125], loss: 0.542, per_step_time: 1414ms, lr: 7.8058865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65489 samples/s/p 2:27:51 } +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3106/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 7.803026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66146 samples/s/p 2:27:38 } +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3108/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 7.800165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.65926 samples/s/p 2:27:39 } +2024-07-30 03:40:50,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3110/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.797301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:50,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66124 samples/s/p 2:27:33 } +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3112/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 7.794437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66098 samples/s/p 2:27:30 } +2024-07-30 03:40:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3114/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 7.791571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:56,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66069 samples/s/p 2:27:28 } +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3116/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 7.788703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:59,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.65967 samples/s/p 2:27:27 } +2024-07-30 03:41:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3118/ 3125], loss: 0.107, per_step_time: 1413ms, lr: 7.785835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65952 samples/s/p 2:27:24 } +2024-07-30 03:41:04,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3120/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 7.782965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:04,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65756 samples/s/p 2:27:24 } +2024-07-30 03:41:07,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3122/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 7.780095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:07,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65886 samples/s/p 2:27:19 } +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3124/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.777224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:10,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65884 samples/s/p 2:27:17 } +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.774349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65797 samples/s/p 2:27:15 } +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 7.771474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65884 samples/s/p 2:27:11 } +2024-07-30 03:41:19,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 5/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 7.768598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:19,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65846 samples/s/p 2:27:09 } +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 7/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.7657205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.66091 samples/s/p 2:27:02 } +2024-07-30 03:41:24,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 9/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.762842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:24,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65852 samples/s/p 2:27:03 } +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 11/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.759961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.65839 samples/s/p 2:27:00 } +2024-07-30 03:41:30,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 13/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.757079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:30,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66089 samples/s/p 2:26:54 } +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 15/ 3125], loss: 0.090, per_step_time: 1412ms, lr: 7.754197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66195 samples/s/p 2:26:49 } +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 17/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 7.751312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.65975 samples/s/p 2:26:50 } +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 19/ 3125], loss: 0.346, per_step_time: 1412ms, lr: 7.748427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66214 samples/s/p 2:26:43 } +2024-07-30 03:41:41,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 21/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 7.74554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:41,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66036 samples/s/p 2:26:43 } +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 23/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.742651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66088 samples/s/p 2:26:40 } +2024-07-30 03:41:47,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 25/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 7.739762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:47,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65809 samples/s/p 2:26:41 } +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 27/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.736871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65942 samples/s/p 2:26:36 } +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 29/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 7.733979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66178 samples/s/p 2:26:30 } +2024-07-30 03:41:55,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 31/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.731086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66139 samples/s/p 2:26:27 } +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 33/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.728191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:58,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66036 samples/s/p 2:26:26 } +2024-07-30 03:42:01,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 35/ 3125], loss: 0.050, per_step_time: 1413ms, lr: 7.725296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:01,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66091 samples/s/p 2:26:23 } +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 37/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 7.7223995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66012 samples/s/p 2:26:21 } +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 39/ 3125], loss: 0.476, per_step_time: 1413ms, lr: 7.7195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65896 samples/s/p 2:26:20 } +2024-07-30 03:42:10,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 41/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 7.7166005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66053 samples/s/p 2:26:15 } +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 43/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 7.713699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66094 samples/s/p 2:26:11 } +2024-07-30 03:42:15,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 45/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.710796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:15,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66003 samples/s/p 2:26:10 } +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 47/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.707892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65691 samples/s/p 2:26:12 } +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 49/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 7.704987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:21,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65317 samples/s/p 2:26:15 } +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 51/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 7.702081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65424 samples/s/p 2:26:10 } +2024-07-30 03:42:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 53/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 7.699174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65654 samples/s/p 2:26:04 } +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 55/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.696265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66111 samples/s/p 2:25:54 } +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 57/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.693354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:32,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66137 samples/s/p 2:25:51 } +2024-07-30 03:42:35,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 59/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 7.6904425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:35,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.66165 samples/s/p 2:25:47 } +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 61/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 7.687529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.65803 samples/s/p 2:25:50 } +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 63/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 7.684615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65771 samples/s/p 2:25:48 } +2024-07-30 03:42:44,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 65/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 7.6817005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:44,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.66216 samples/s/p 2:25:38 } +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 67/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 7.678784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65866 samples/s/p 2:25:41 } +2024-07-30 03:42:49,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 69/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 7.675866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:49,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65864 samples/s/p 2:25:38 } +2024-07-30 03:42:52,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 71/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.6729475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65961 samples/s/p 2:25:34 } +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 73/ 3125], loss: 0.266, per_step_time: 1425ms, lr: 7.670027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.61308 samples/s/p 2:26:43 } +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 75/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.667105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:58,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.66090 samples/s/p 2:25:26 } +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 77/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.664182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:01,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65963 samples/s/p 2:25:25 } +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 79/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.661257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66016 samples/s/p 2:25:22 } +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 81/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.658331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:06,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66091 samples/s/p 2:25:18 } +2024-07-30 03:43:09,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 83/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.655404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:09,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66130 samples/s/p 2:25:14 } +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 85/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 7.652477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66224 samples/s/p 2:25:10 } +2024-07-30 03:43:15,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 87/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.649548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66046 samples/s/p 2:25:10 } +2024-07-30 03:43:18,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 89/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 7.646618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:18,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66206 samples/s/p 2:25:04 } +2024-07-30 03:43:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 91/ 3125], loss: 0.132, per_step_time: 1412ms, lr: 7.643685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66172 samples/s/p 2:25:02 } +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 93/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 7.640752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65918 samples/s/p 2:25:03 } +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 95/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 7.637817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66125 samples/s/p 2:24:57 } +2024-07-30 03:43:29,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 97/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6348815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:29,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.66117 samples/s/p 2:24:55 } +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 99/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.631944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65950 samples/s/p 2:24:54 } +2024-07-30 03:43:35,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 101/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 7.629007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:35,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65819 samples/s/p 2:24:53 } +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 103/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 7.626067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65759 samples/s/p 2:24:52 } +2024-07-30 03:43:40,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 105/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 7.6231267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:40,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65738 samples/s/p 2:24:49 } +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 107/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.6201854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65731 samples/s/p 2:24:46 } +2024-07-30 03:43:46,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 109/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6172423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65967 samples/s/p 2:24:40 } +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 111/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 7.614297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65917 samples/s/p 2:24:38 } +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 113/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.6113506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65948 samples/s/p 2:24:34 } +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 115/ 3125], loss: 0.049, per_step_time: 1412ms, lr: 7.608404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66242 samples/s/p 2:24:27 } +2024-07-30 03:43:57,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 117/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 7.6054557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65877 samples/s/p 2:24:30 } +2024-07-30 03:44:00,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 119/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.6025067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:00,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66095 samples/s/p 2:24:24 } +2024-07-30 03:44:03,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 121/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.5995563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:03,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66132 samples/s/p 2:24:20 } +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 123/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.5966045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65963 samples/s/p 2:24:20 } +2024-07-30 03:44:09,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 125/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.5936505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:09,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65629 samples/s/p 2:24:22 } +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 127/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 7.5906964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65974 samples/s/p 2:24:14 } +2024-07-30 03:44:14,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 129/ 3125], loss: 0.126, per_step_time: 1414ms, lr: 7.5877415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:14,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65702 samples/s/p 2:24:16 } +2024-07-30 03:44:17,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 131/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.5847843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:17,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.66038 samples/s/p 2:24:08 } +2024-07-30 03:44:20,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 133/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.5818257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:20,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65744 samples/s/p 2:24:09 } +2024-07-30 03:44:23,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 135/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.578866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65891 samples/s/p 2:24:04 } +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 137/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 7.5759062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:26,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65844 samples/s/p 2:24:02 } +2024-07-30 03:44:29,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 139/ 3125], loss: 0.216, per_step_time: 1415ms, lr: 7.5729445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:29,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65354 samples/s/p 2:24:07 } +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 141/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 7.569982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:31,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.66177 samples/s/p 2:23:51 } +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 143/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 7.567018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65847 samples/s/p 2:23:54 } +2024-07-30 03:44:37,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 145/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 7.5640514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:37,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66287 samples/s/p 2:23:44 } +2024-07-30 03:44:40,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 147/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.5610837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:40,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65985 samples/s/p 2:23:46 } +2024-07-30 03:44:43,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 149/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.5581165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:43,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66120 samples/s/p 2:23:41 } +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 151/ 3125], loss: 0.153, per_step_time: 1412ms, lr: 7.555147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66259 samples/s/p 2:23:36 } +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 153/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 7.5521775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:48,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65936 samples/s/p 2:23:38 } +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 155/ 3125], loss: 0.485, per_step_time: 1412ms, lr: 7.5492057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66242 samples/s/p 2:23:31 } +2024-07-30 03:44:54,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 157/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 7.5462335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:54,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66006 samples/s/p 2:23:31 } +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 159/ 3125], loss: 0.145, per_step_time: 1412ms, lr: 7.5432595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66314 samples/s/p 2:23:24 } +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 161/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 7.5402836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:00,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66301 samples/s/p 2:23:21 } +2024-07-30 03:45:03,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 163/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 7.5373077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:03,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65934 samples/s/p 2:23:24 } +2024-07-30 03:45:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 165/ 3125], loss: 0.220, per_step_time: 1419ms, lr: 7.5343296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.63672 samples/s/p 2:23:56 } +2024-07-30 03:45:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 167/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.5313505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:08,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65934 samples/s/p 2:23:18 } +2024-07-30 03:45:11,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 169/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 7.5283706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66131 samples/s/p 2:23:13 } +2024-07-30 03:45:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 171/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 7.525389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66131 samples/s/p 2:23:10 } +2024-07-30 03:45:17,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 173/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 7.522407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:17,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65576 samples/s/p 2:23:15 } +2024-07-30 03:45:20,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 175/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.519424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:20,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66046 samples/s/p 2:23:05 } +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 177/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 7.516439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66087 samples/s/p 2:23:02 } +2024-07-30 03:45:25,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 179/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 7.5134526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:25,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65498 samples/s/p 2:23:08 } +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 181/ 3125], loss: 0.536, per_step_time: 1413ms, lr: 7.5104654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.66015 samples/s/p 2:22:57 } +2024-07-30 03:45:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 183/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.5074754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65877 samples/s/p 2:22:57 } +2024-07-30 03:45:34,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 185/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.5044863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.66112 samples/s/p 2:22:50 } +2024-07-30 03:45:37,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 187/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.501496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:37,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65749 samples/s/p 2:22:53 } +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 189/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 7.4985037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65819 samples/s/p 2:22:49 } +2024-07-30 03:45:42,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 191/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 7.495511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:42,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65875 samples/s/p 2:22:45 } +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 193/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.4925165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:45,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65774 samples/s/p 2:22:44 } +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 195/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 7.4895215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65846 samples/s/p 2:22:40 } +2024-07-30 03:45:51,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 197/ 3125], loss: 0.272, per_step_time: 1417ms, lr: 7.4865234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:51,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.64427 samples/s/p 2:22:59 } +2024-07-30 03:45:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 199/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 7.4835257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65673 samples/s/p 2:22:37 } +2024-07-30 03:45:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 201/ 3125], loss: 0.027, per_step_time: 1414ms, lr: 7.4805257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65747 samples/s/p 2:22:33 } +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 203/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.4775253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.66115 samples/s/p 2:22:25 } +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 205/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 7.4745244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:02,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65667 samples/s/p 2:22:29 } +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 207/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.4715217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.66055 samples/s/p 2:22:20 } +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 209/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 7.4685177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66135 samples/s/p 2:22:16 } +2024-07-30 03:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 211/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.465513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66012 samples/s/p 2:22:15 } +2024-07-30 03:46:13,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 213/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.462506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65900 samples/s/p 2:22:14 } +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 215/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 7.4594986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66151 samples/s/p 2:22:07 } +2024-07-30 03:46:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 217/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.45649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:19,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66011 samples/s/p 2:22:07 } +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 219/ 3125], loss: 0.121, per_step_time: 1412ms, lr: 7.4534796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66214 samples/s/p 2:22:01 } +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 221/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.4504687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66165 samples/s/p 2:21:59 } +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 223/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 7.447457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66104 samples/s/p 2:21:57 } +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 225/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 7.4444433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66235 samples/s/p 2:21:52 } +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 227/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.4414297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65920 samples/s/p 2:21:54 } +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 229/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.438414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:36,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66108 samples/s/p 2:21:48 } +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 231/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.4353975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66034 samples/s/p 2:21:46 } +2024-07-30 03:46:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 233/ 3125], loss: 0.202, per_step_time: 1416ms, lr: 7.432379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.64863 samples/s/p 2:22:01 } +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 235/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.429359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65852 samples/s/p 2:21:43 } +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 237/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 7.4263385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65937 samples/s/p 2:21:39 } +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 239/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66054 samples/s/p 2:21:35 } +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 241/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.4202953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66112 samples/s/p 2:21:31 } +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 243/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.4172717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65829 samples/s/p 2:21:33 } +2024-07-30 03:46:59,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 245/ 3125], loss: 0.160, per_step_time: 1416ms, lr: 7.4142467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:59,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.64629 samples/s/p 2:21:48 } +2024-07-30 03:47:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 247/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 7.4112213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:02,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65488 samples/s/p 2:21:32 } +2024-07-30 03:47:04,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 249/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 7.408193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:04,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65927 samples/s/p 2:21:23 } +2024-07-30 03:47:07,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 251/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 7.4051645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.66166 samples/s/p 2:21:16 } +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 253/ 3125], loss: 0.345, per_step_time: 1415ms, lr: 7.4021355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.65156 samples/s/p 2:21:28 } +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 255/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.399104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.66008 samples/s/p 2:21:13 } +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 257/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.396072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:16,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65753 samples/s/p 2:21:14 } +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 259/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 7.393039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65251 samples/s/p 2:21:19 } +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 261/ 3125], loss: 0.369, per_step_time: 1414ms, lr: 7.3900055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65753 samples/s/p 2:21:08 } +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 263/ 3125], loss: 0.533, per_step_time: 1414ms, lr: 7.3869705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65715 samples/s/p 2:21:06 } +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 265/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 7.383934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:27,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66098 samples/s/p 2:20:57 } +2024-07-30 03:47:30,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 267/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.380896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:30,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65914 samples/s/p 2:20:57 } +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 269/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 7.377857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:33,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65981 samples/s/p 2:20:53 } +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 271/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 7.374817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66048 samples/s/p 2:20:50 } +2024-07-30 03:47:38,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 273/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.371776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65842 samples/s/p 2:20:50 } +2024-07-30 03:47:41,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 275/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.3687343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:41,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65827 samples/s/p 2:20:47 } +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 277/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 7.3656915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:44,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.66180 samples/s/p 2:20:39 } +2024-07-30 03:47:47,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 279/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.3626475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:47,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65781 samples/s/p 2:20:42 } +2024-07-30 03:47:50,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 281/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.3596025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:50,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65726 samples/s/p 2:20:40 } +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 283/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.3565557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65892 samples/s/p 2:20:35 } +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 285/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.353507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66164 samples/s/p 2:20:28 } +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 287/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 7.350459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65833 samples/s/p 2:20:30 } +2024-07-30 03:48:01,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 289/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.347408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:01,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66096 samples/s/p 2:20:24 } +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 291/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.344357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:04,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66052 samples/s/p 2:20:21 } +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 293/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 7.341305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65980 samples/s/p 2:20:20 } +2024-07-30 03:48:10,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 295/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.338252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:10,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65831 samples/s/p 2:20:19 } +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 297/ 3125], loss: 0.263, per_step_time: 1412ms, lr: 7.3351976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:12,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66235 samples/s/p 2:20:10 } +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 299/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 7.3321426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66256 samples/s/p 2:20:07 } +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 301/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.329085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66042 samples/s/p 2:20:07 } +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 303/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 7.3260276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:21,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65902 samples/s/p 2:20:07 } +2024-07-30 03:48:24,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 305/ 3125], loss: 0.338, per_step_time: 1425ms, lr: 7.3229676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:24,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.61295 samples/s/p 2:21:13 } +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 307/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.319908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65379 samples/s/p 2:20:09 } +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 309/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.3168467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.66079 samples/s/p 2:19:55 } +2024-07-30 03:48:32,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 311/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 7.313785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:32,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65711 samples/s/p 2:19:58 } +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 313/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 7.3107217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66017 samples/s/p 2:19:51 } +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 315/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.307658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:38,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66089 samples/s/p 2:19:47 } +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 317/ 3125], loss: 0.287, per_step_time: 1415ms, lr: 7.3045926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65160 samples/s/p 2:19:58 } +2024-07-30 03:48:44,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 319/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 7.301526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:44,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66137 samples/s/p 2:19:41 } +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 321/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.2984576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65473 samples/s/p 2:19:48 } +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 323/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.2953876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:49,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66074 samples/s/p 2:19:36 } +2024-07-30 03:48:52,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 325/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 7.292318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:52,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66145 samples/s/p 2:19:32 } +2024-07-30 03:48:55,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 327/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.289247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:55,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65992 samples/s/p 2:19:31 } +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 329/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 7.2861753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65746 samples/s/p 2:19:32 } +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 331/ 3125], loss: 0.421, per_step_time: 1412ms, lr: 7.2831026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:01,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66267 samples/s/p 2:19:22 } +2024-07-30 03:49:04,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 333/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 7.280029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:04,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66113 samples/s/p 2:19:21 } +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 335/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 7.2769526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:06,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66419 samples/s/p 2:19:14 } +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 337/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.2738767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65911 samples/s/p 2:19:18 } +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 339/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 7.270799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:12,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65921 samples/s/p 2:19:15 } +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 341/ 3125], loss: 0.279, per_step_time: 1415ms, lr: 7.2677194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65192 samples/s/p 2:19:23 } +2024-07-30 03:49:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 343/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.2646403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:18,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.66067 samples/s/p 2:19:08 } +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 345/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.2615594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65721 samples/s/p 2:19:10 } +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 347/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.2584776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65714 samples/s/p 2:19:07 } +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 349/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.255395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:26,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65919 samples/s/p 2:19:01 } +2024-07-30 03:49:29,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 351/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 7.2523117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:29,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66174 samples/s/p 2:18:55 } +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 353/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.249226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65634 samples/s/p 2:19:00 } +2024-07-30 03:49:35,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 355/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.2461407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:35,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66007 samples/s/p 2:18:52 } +2024-07-30 03:49:38,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 357/ 3125], loss: 0.162, per_step_time: 1415ms, lr: 7.2430526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:38,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65337 samples/s/p 2:18:59 } +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 359/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.2399635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65982 samples/s/p 2:18:46 } +2024-07-30 03:49:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 361/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.236874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:43,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65374 samples/s/p 2:18:52 } +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 363/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.233784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66142 samples/s/p 2:18:38 } +2024-07-30 03:49:49,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 365/ 3125], loss: 0.235, per_step_time: 1412ms, lr: 7.230693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:49,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66177 samples/s/p 2:18:35 } +2024-07-30 03:49:52,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 367/ 3125], loss: 0.042, per_step_time: 1413ms, lr: 7.2276007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66166 samples/s/p 2:18:32 } +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 369/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.224507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:55,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66044 samples/s/p 2:18:31 } +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 371/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.221411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66006 samples/s/p 2:18:29 } +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 373/ 3125], loss: 0.220, per_step_time: 1418ms, lr: 7.218316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.63992 samples/s/p 2:18:56 } +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 375/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.215219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66103 samples/s/p 2:18:22 } +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 377/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 7.21212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:06,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65096 samples/s/p 2:18:34 } +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 379/ 3125], loss: 0.083, per_step_time: 1412ms, lr: 7.209022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:09,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66299 samples/s/p 2:18:13 } +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 381/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.205922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66210 samples/s/p 2:18:12 } +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 383/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.202821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66021 samples/s/p 2:18:12 } +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 385/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 7.199719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65694 samples/s/p 2:18:14 } +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 387/ 3125], loss: 0.111, per_step_time: 1414ms, lr: 7.1966165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65769 samples/s/p 2:18:10 } +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 389/ 3125], loss: 0.102, per_step_time: 1415ms, lr: 7.193513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:23,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65127 samples/s/p 2:18:16 } +2024-07-30 03:50:26,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 391/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 7.190406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:26,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65957 samples/s/p 2:18:01 } +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 393/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.1872996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66015 samples/s/p 2:17:58 } +2024-07-30 03:50:31,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 395/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.184192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66123 samples/s/p 2:17:53 } +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 397/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 7.181084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:34,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65940 samples/s/p 2:17:53 } +2024-07-30 03:50:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 399/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.177975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66116 samples/s/p 2:17:48 } +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 401/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.174864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66290 samples/s/p 2:17:42 } +2024-07-30 03:50:43,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 403/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.1717536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:43,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65879 samples/s/p 2:17:46 } +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 405/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.168641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66005 samples/s/p 2:17:41 } +2024-07-30 03:50:48,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 407/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 7.1655268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:48,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65906 samples/s/p 2:17:40 } +2024-07-30 03:50:51,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 409/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.162412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:51,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65919 samples/s/p 2:17:37 } +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 411/ 3125], loss: 0.375, per_step_time: 1412ms, lr: 7.1592967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:54,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66269 samples/s/p 2:17:29 } +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 413/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.1561794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66050 samples/s/p 2:17:29 } +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 415/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.1530612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:00,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66089 samples/s/p 2:17:26 } +2024-07-30 03:51:03,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 417/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 7.149943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:03,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66032 samples/s/p 2:17:24 } +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 419/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 7.146824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66146 samples/s/p 2:17:19 } +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 421/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 7.1437034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66217 samples/s/p 2:17:15 } +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 423/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 7.1405816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66013 samples/s/p 2:17:15 } +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 425/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.137458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.66026 samples/s/p 2:17:12 } +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 427/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.1343343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:17,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65853 samples/s/p 2:17:12 } +2024-07-30 03:51:20,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 429/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 7.131209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.66032 samples/s/p 2:17:07 } +2024-07-30 03:51:22,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 431/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 7.128083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:22,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65737 samples/s/p 2:17:08 } +2024-07-30 03:51:25,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 433/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.1249565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:25,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65857 samples/s/p 2:17:03 } +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 435/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 7.1218287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65610 samples/s/p 2:17:04 } +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 437/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.1187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65411 samples/s/p 2:17:04 } +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 439/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.11557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65750 samples/s/p 2:16:57 } +2024-07-30 03:51:37,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 441/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.1124396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:37,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65607 samples/s/p 2:16:56 } +2024-07-30 03:51:39,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 443/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 7.109307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:39,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66200 samples/s/p 2:16:44 } +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 445/ 3125], loss: 0.195, per_step_time: 1412ms, lr: 7.106174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:42,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66199 samples/s/p 2:16:42 } +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 447/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.103039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65982 samples/s/p 2:16:42 } +2024-07-30 03:51:48,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 449/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.0999045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:48,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65818 samples/s/p 2:16:41 } +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 451/ 3125], loss: 0.402, per_step_time: 1412ms, lr: 7.0967685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66295 samples/s/p 2:16:32 } +2024-07-30 03:51:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 453/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 7.093632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.65659 samples/s/p 2:16:38 } +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 455/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.0904944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66062 samples/s/p 2:16:29 } +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 457/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 7.0873557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:59,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66295 samples/s/p 2:16:23 } +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 459/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.0842143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66080 samples/s/p 2:16:24 } +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 461/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 7.081074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66289 samples/s/p 2:16:18 } +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 463/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.077932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66033 samples/s/p 2:16:19 } +2024-07-30 03:52:11,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 465/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.0747888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66065 samples/s/p 2:16:15 } +2024-07-30 03:52:13,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 467/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.071645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66078 samples/s/p 2:16:12 } +2024-07-30 03:52:16,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 469/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 7.0685005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:16,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65955 samples/s/p 2:16:11 } +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 471/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.0653537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65899 samples/s/p 2:16:09 } +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 473/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.0622073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:22,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65929 samples/s/p 2:16:06 } +2024-07-30 03:52:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 475/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 7.0590595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:25,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.66052 samples/s/p 2:16:01 } +2024-07-30 03:52:28,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 477/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.055911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:28,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65924 samples/s/p 2:16:00 } +2024-07-30 03:52:30,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 479/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 7.0527603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:30,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65380 samples/s/p 2:16:05 } +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 481/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 7.0496094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:33,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.65842 samples/s/p 2:15:56 } +2024-07-30 03:52:36,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 483/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.046458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66117 samples/s/p 2:15:49 } +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 485/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 7.043305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66063 samples/s/p 2:15:47 } +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 487/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.040151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66100 samples/s/p 2:15:44 } +2024-07-30 03:52:45,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 489/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.036997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:45,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66061 samples/s/p 2:15:41 } +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 491/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.033841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.65907 samples/s/p 2:15:41 } +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 493/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.0306837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66123 samples/s/p 2:15:35 } +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 495/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 7.0275264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66201 samples/s/p 2:15:31 } +2024-07-30 03:52:56,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 497/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 7.0243677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:56,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66158 samples/s/p 2:15:29 } +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 499/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.0212086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66177 samples/s/p 2:15:26 } +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 501/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 7.018047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:02,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65918 samples/s/p 2:15:26 } +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 503/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 7.014886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65634 samples/s/p 2:15:28 } +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 505/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.0117235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65903 samples/s/p 2:15:21 } +2024-07-30 03:53:10,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 507/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 7.0085603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:10,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66265 samples/s/p 2:15:13 } +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 509/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 7.0053957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65442 samples/s/p 2:15:22 } +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 511/ 3125], loss: 0.140, per_step_time: 1414ms, lr: 7.0022306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65542 samples/s/p 2:15:18 } +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 513/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 6.9990638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65718 samples/s/p 2:15:12 } +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 515/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 6.9958965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66192 samples/s/p 2:15:03 } +2024-07-30 03:53:24,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 517/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 6.9927287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:24,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66062 samples/s/p 2:15:02 } +2024-07-30 03:53:27,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 519/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 6.9895596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:27,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66092 samples/s/p 2:14:59 } +2024-07-30 03:53:30,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 521/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.9863895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:30,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66156 samples/s/p 2:14:55 } +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 523/ 3125], loss: 0.258, per_step_time: 1420ms, lr: 6.983218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:33,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.63011 samples/s/p 2:15:37 } +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 525/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.980046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66052 samples/s/p 2:14:51 } +2024-07-30 03:53:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 527/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.976873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.66078 samples/s/p 2:14:47 } +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 529/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 6.9736993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65912 samples/s/p 2:14:47 } +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 531/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 6.9705247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.66071 samples/s/p 2:14:42 } +2024-07-30 03:53:47,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 533/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 6.967349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:47,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65800 samples/s/p 2:14:43 } +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 535/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 6.964172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:50,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65487 samples/s/p 2:14:45 } +2024-07-30 03:53:53,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 537/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 6.9609937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:53,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65856 samples/s/p 2:14:36 } +2024-07-30 03:53:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 539/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.957816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:55,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66055 samples/s/p 2:14:31 } +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 541/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 6.9546363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65828 samples/s/p 2:14:31 } +2024-07-30 03:54:01,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 543/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.9514554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:01,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66058 samples/s/p 2:14:25 } +2024-07-30 03:54:04,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 545/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.9482744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:04,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65966 samples/s/p 2:14:24 } +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 547/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 6.945091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66021 samples/s/p 2:14:20 } +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 549/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9419084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:10,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66138 samples/s/p 2:14:15 } +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 551/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.9387243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66041 samples/s/p 2:14:14 } +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 553/ 3125], loss: 0.216, per_step_time: 1417ms, lr: 6.935539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.64201 samples/s/p 2:14:37 } +2024-07-30 03:54:18,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 555/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 6.9323532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66167 samples/s/p 2:14:07 } +2024-07-30 03:54:21,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 557/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 6.929166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:21,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66082 samples/s/p 2:14:05 } +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 559/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 6.9259777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66058 samples/s/p 2:14:02 } +2024-07-30 03:54:27,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 561/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 6.9227895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:27,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66048 samples/s/p 2:14:00 } +2024-07-30 03:54:29,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 563/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.9195994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:29,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66047 samples/s/p 2:13:57 } +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 565/ 3125], loss: 0.587, per_step_time: 1413ms, lr: 6.916409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.66034 samples/s/p 2:13:54 } +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 567/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.913218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65970 samples/s/p 2:13:52 } +2024-07-30 03:54:38,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 569/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.9100247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:38,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65832 samples/s/p 2:13:52 } +2024-07-30 03:54:41,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 571/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 6.9068315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:41,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65959 samples/s/p 2:13:47 } +2024-07-30 03:54:44,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 573/ 3125], loss: 0.064, per_step_time: 1416ms, lr: 6.9036373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:44,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.64611 samples/s/p 2:14:03 } +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 575/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.9004423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66097 samples/s/p 2:13:39 } +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 577/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 6.8972463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:49,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.65861 samples/s/p 2:13:40 } +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 579/ 3125], loss: 0.125, per_step_time: 1412ms, lr: 6.894049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66197 samples/s/p 2:13:32 } +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 581/ 3125], loss: 0.071, per_step_time: 1413ms, lr: 6.8908503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:55,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66115 samples/s/p 2:13:31 } +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 583/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 6.887652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65357 samples/s/p 2:13:39 } +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 585/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.8844524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65801 samples/s/p 2:13:29 } +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 587/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.881252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66109 samples/s/p 2:13:22 } +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 589/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 6.8780505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:06,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65684 samples/s/p 2:13:25 } +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 591/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.8748477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66100 samples/s/p 2:13:17 } +2024-07-30 03:55:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 593/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.8716445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:12,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.66042 samples/s/p 2:13:15 } +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 595/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 6.8684403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65650 samples/s/p 2:13:17 } +2024-07-30 03:55:18,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 597/ 3125], loss: 0.225, per_step_time: 1418ms, lr: 6.8652353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:18,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.63981 samples/s/p 2:13:38 } +2024-07-30 03:55:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 599/ 3125], loss: 0.277, per_step_time: 1426ms, lr: 6.8620293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:21,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.60845 samples/s/p 2:14:20 } +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 601/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.858822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65735 samples/s/p 2:13:08 } +2024-07-30 03:55:26,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 603/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 6.855614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65837 samples/s/p 2:13:03 } +2024-07-30 03:55:29,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 605/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 6.852406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65906 samples/s/p 2:13:00 } +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 607/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 6.8491963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65983 samples/s/p 2:12:56 } +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 609/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.8459854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65734 samples/s/p 2:12:56 } +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 611/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.8427744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65809 samples/s/p 2:12:53 } +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 613/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.8395625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:40,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65893 samples/s/p 2:12:48 } +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 615/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 6.836349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66208 samples/s/p 2:12:41 } +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 617/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.833135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:46,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65865 samples/s/p 2:12:43 } +2024-07-30 03:55:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 619/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 6.829921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66197 samples/s/p 2:12:36 } +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 621/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 6.826705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:52,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66048 samples/s/p 2:12:35 } +2024-07-30 03:55:55,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 623/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.823488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:55,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66121 samples/s/p 2:12:31 } +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 625/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 6.8202708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:57,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.66031 samples/s/p 2:12:30 } +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 627/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 6.817053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65801 samples/s/p 2:12:30 } +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 629/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.8138334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.66028 samples/s/p 2:12:24 } +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 631/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.8106133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65878 samples/s/p 2:12:23 } +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 633/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 6.8073928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:09,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65700 samples/s/p 2:12:23 } +2024-07-30 03:56:12,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 635/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 6.804171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:12,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65494 samples/s/p 2:12:23 } +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 637/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.8009476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65980 samples/s/p 2:12:13 } +2024-07-30 03:56:17,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 639/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 6.7977244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:17,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65841 samples/s/p 2:12:12 } +2024-07-30 03:56:20,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 641/ 3125], loss: 0.334, per_step_time: 1412ms, lr: 6.7945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:20,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66189 samples/s/p 2:12:05 } +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 643/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.7912756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66104 samples/s/p 2:12:03 } +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 645/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 6.788049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.65995 samples/s/p 2:12:02 } +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 647/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.7848214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66008 samples/s/p 2:11:59 } +2024-07-30 03:56:31,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 649/ 3125], loss: 0.085, per_step_time: 1417ms, lr: 6.7815945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:31,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.64246 samples/s/p 2:12:21 } +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 651/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.7783653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65892 samples/s/p 2:11:55 } +2024-07-30 03:56:37,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 653/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 6.7751357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:37,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65935 samples/s/p 2:11:51 } +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 655/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 6.7719066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66190 samples/s/p 2:11:45 } +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 657/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 6.768675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66148 samples/s/p 2:11:43 } +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 659/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 6.7654423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66187 samples/s/p 2:11:39 } +2024-07-30 03:56:48,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 661/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.76221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66025 samples/s/p 2:11:39 } +2024-07-30 03:56:51,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 663/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 6.7589763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:51,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65968 samples/s/p 2:11:37 } +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 665/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 6.7557417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66098 samples/s/p 2:11:32 } +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 667/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 6.752506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66048 samples/s/p 2:11:30 } +2024-07-30 03:57:00,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 669/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.7492706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:00,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65998 samples/s/p 2:11:28 } +2024-07-30 03:57:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 671/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 6.7460333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66181 samples/s/p 2:11:22 } +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 673/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.742795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:05,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65988 samples/s/p 2:11:22 } +2024-07-30 03:57:08,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 675/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 6.7395567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:08,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66048 samples/s/p 2:11:19 } +2024-07-30 03:57:11,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 677/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 6.736317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:11,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65761 samples/s/p 2:11:20 } +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 679/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 6.733077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65518 samples/s/p 2:11:20 } +2024-07-30 03:57:17,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 681/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 6.7298356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:17,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65786 samples/s/p 2:11:14 } +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 683/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.7265933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65726 samples/s/p 2:11:12 } +2024-07-30 03:57:22,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 685/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 6.723351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:22,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.66020 samples/s/p 2:11:05 } +2024-07-30 03:57:25,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 687/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 6.7201063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.66015 samples/s/p 2:11:02 } +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 689/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.7168626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65921 samples/s/p 2:11:01 } +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 691/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.7136175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.66130 samples/s/p 2:10:55 } +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 693/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 6.710371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65515 samples/s/p 2:11:01 } +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 695/ 3125], loss: 0.328, per_step_time: 1417ms, lr: 6.707124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.64537 samples/s/p 2:11:11 } +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 697/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 6.703876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65767 samples/s/p 2:10:51 } +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 699/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 6.700628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65848 samples/s/p 2:10:48 } +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 701/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.6973794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:45,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.66059 samples/s/p 2:10:42 } +2024-07-30 03:57:48,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 703/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 6.6941284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:48,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65735 samples/s/p 2:10:43 } +2024-07-30 03:57:51,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 705/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.690877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:51,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.65966 samples/s/p 2:10:37 } +2024-07-30 03:57:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 707/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 6.6876255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66226 samples/s/p 2:10:31 } +2024-07-30 03:57:56,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 709/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 6.6843727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:56,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66123 samples/s/p 2:10:30 } +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 711/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 6.681119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66050 samples/s/p 2:10:28 } +2024-07-30 03:58:02,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 713/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.6778657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:02,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66033 samples/s/p 2:10:25 } +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 715/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.67461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66250 samples/s/p 2:10:19 } +2024-07-30 03:58:08,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 717/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 6.671354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:08,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66281 samples/s/p 2:10:16 } +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 719/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.6680977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:11,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66004 samples/s/p 2:10:17 } +2024-07-30 03:58:13,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 721/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.6648404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:13,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65943 samples/s/p 2:10:15 } +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 723/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 6.6615817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66107 samples/s/p 2:10:10 } +2024-07-30 03:58:19,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 725/ 3125], loss: 0.420, per_step_time: 1416ms, lr: 6.6583234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:19,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.64763 samples/s/p 2:10:26 } +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 727/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 6.6550633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.65836 samples/s/p 2:10:08 } +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 729/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.6518032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:25,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66050 samples/s/p 2:10:02 } +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 731/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 6.648541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66277 samples/s/p 2:09:56 } +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 733/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 6.6452794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:30,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66114 samples/s/p 2:09:56 } +2024-07-30 03:58:33,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 735/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 6.6420166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:33,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66132 samples/s/p 2:09:53 } +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 737/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 6.6387524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:36,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65669 samples/s/p 2:09:56 } +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 739/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 6.6354874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65760 samples/s/p 2:09:52 } +2024-07-30 03:58:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 741/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 6.632223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65786 samples/s/p 2:09:49 } +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 743/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 6.6289567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:45,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65817 samples/s/p 2:09:46 } +2024-07-30 03:58:47,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 745/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 6.62569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:47,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66097 samples/s/p 2:09:39 } +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 747/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 6.622422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65933 samples/s/p 2:09:39 } +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 749/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 6.6191533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66134 samples/s/p 2:09:33 } +2024-07-30 03:58:56,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 751/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 6.6158846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65937 samples/s/p 2:09:33 } +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 753/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 6.612614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66125 samples/s/p 2:09:27 } +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 755/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 6.6093444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66150 samples/s/p 2:09:24 } +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 757/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 6.6060725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:04,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66113 samples/s/p 2:09:22 } +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 759/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 6.6028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66204 samples/s/p 2:09:18 } +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 761/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 6.599527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66146 samples/s/p 2:09:16 } +2024-07-30 03:59:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 763/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 6.5962536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:13,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66052 samples/s/p 2:09:14 } +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 765/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.5929794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:16,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66018 samples/s/p 2:09:12 } +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 767/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.5897034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:19,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65987 samples/s/p 2:09:10 } +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 769/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 6.5864274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66123 samples/s/p 2:09:05 } +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 771/ 3125], loss: 0.358, per_step_time: 1415ms, lr: 6.5831505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65310 samples/s/p 2:09:13 } +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 773/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 6.5798736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:27,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65924 samples/s/p 2:09:02 } +2024-07-30 03:59:30,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 775/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 6.5765944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:30,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.66173 samples/s/p 2:08:56 } +2024-07-30 03:59:33,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 777/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 6.5733157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:33,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65844 samples/s/p 2:08:57 } +2024-07-30 03:59:36,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 779/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.570036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:36,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65972 samples/s/p 2:08:53 } +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 781/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.5667555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:38,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66183 samples/s/p 2:08:47 } +2024-07-30 03:59:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 783/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 6.5634736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66192 samples/s/p 2:08:44 } +2024-07-30 03:59:44,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 785/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.560192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65889 samples/s/p 2:08:45 } +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 787/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 6.556909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65598 samples/s/p 2:08:47 } +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 789/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 6.553625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65840 samples/s/p 2:08:40 } +2024-07-30 03:59:53,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 791/ 3125], loss: 0.308, per_step_time: 1412ms, lr: 6.550342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66174 samples/s/p 2:08:33 } +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 793/ 3125], loss: 0.298, per_step_time: 1414ms, lr: 6.5470563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65684 samples/s/p 2:08:37 } +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 795/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.5437703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66127 samples/s/p 2:08:28 } +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 797/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.540484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65931 samples/s/p 2:08:28 } +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 799/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 6.5371964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66021 samples/s/p 2:08:24 } +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 801/ 3125], loss: 0.258, per_step_time: 1445ms, lr: 6.5339086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:07,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.53602 samples/s/p 2:11:14 } +2024-07-30 04:00:10,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 803/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 6.53062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:10,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66147 samples/s/p 2:08:16 } +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 805/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.5273302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65832 samples/s/p 2:08:18 } +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 807/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.5240406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65956 samples/s/p 2:08:13 } +2024-07-30 04:00:18,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 809/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 6.5207496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:18,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.65994 samples/s/p 2:08:10 } +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 811/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 6.5174577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66317 samples/s/p 2:08:03 } +2024-07-30 04:00:24,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 813/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.5141653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:24,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66057 samples/s/p 2:08:04 } +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 815/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 6.510872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66128 samples/s/p 2:08:00 } +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 817/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.507578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:30,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66023 samples/s/p 2:07:58 } +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 819/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 6.504284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:32,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65924 samples/s/p 2:07:57 } +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 821/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 6.500989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:35,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66175 samples/s/p 2:07:51 } +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 823/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 6.497693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65904 samples/s/p 2:07:51 } +2024-07-30 04:00:41,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 825/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 6.494396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66367 samples/s/p 2:07:42 } +2024-07-30 04:00:44,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 827/ 3125], loss: 0.490, per_step_time: 1413ms, lr: 6.4910982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:44,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65957 samples/s/p 2:07:45 } +2024-07-30 04:00:47,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 829/ 3125], loss: 0.243, per_step_time: 1412ms, lr: 6.4878004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:47,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66180 samples/s/p 2:07:39 } +2024-07-30 04:00:49,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 831/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 6.4845017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66149 samples/s/p 2:07:37 } +2024-07-30 04:00:52,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 833/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.481202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:52,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65912 samples/s/p 2:07:37 } +2024-07-30 04:00:55,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 835/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.4779024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:55,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65979 samples/s/p 2:07:33 } +2024-07-30 04:00:58,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 837/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.474601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:58,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66146 samples/s/p 2:07:28 } +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 839/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 6.4712985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:01,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65451 samples/s/p 2:07:35 } +2024-07-30 04:01:04,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 841/ 3125], loss: 0.375, per_step_time: 1412ms, lr: 6.4679966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:04,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66200 samples/s/p 2:07:22 } +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 843/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 6.464694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65609 samples/s/p 2:07:27 } +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 845/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 6.4613905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:09,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66165 samples/s/p 2:07:17 } +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 847/ 3125], loss: 0.428, per_step_time: 1414ms, lr: 6.4580854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:12,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65766 samples/s/p 2:07:19 } +2024-07-30 04:01:15,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 849/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 6.4547808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:15,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65816 samples/s/p 2:07:16 } +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 851/ 3125], loss: 0.377, per_step_time: 1414ms, lr: 6.4514747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65737 samples/s/p 2:07:14 } +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 853/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 6.448168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:21,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65351 samples/s/p 2:07:17 } +2024-07-30 04:01:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 855/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 6.4448614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:23,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66131 samples/s/p 2:07:03 } +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 857/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 6.4415535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66127 samples/s/p 2:07:00 } +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 859/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 6.4382443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.65918 samples/s/p 2:07:00 } +2024-07-30 04:01:32,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 861/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 6.434935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:32,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66074 samples/s/p 2:06:55 } +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 863/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.4316255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66122 samples/s/p 2:06:52 } +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 865/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.428315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65855 samples/s/p 2:06:53 } +2024-07-30 04:01:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 867/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 6.425004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:40,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65704 samples/s/p 2:06:52 } +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 869/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.4216915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.66005 samples/s/p 2:06:45 } +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 871/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 6.4183782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.66211 samples/s/p 2:06:39 } +2024-07-30 04:01:49,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 873/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 6.4150654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:49,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65606 samples/s/p 2:06:45 } +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 875/ 3125], loss: 0.493, per_step_time: 1412ms, lr: 6.411751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66256 samples/s/p 2:06:33 } +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 877/ 3125], loss: 0.635, per_step_time: 1413ms, lr: 6.408436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66036 samples/s/p 2:06:33 } +2024-07-30 04:01:57,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 879/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 6.4051214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66062 samples/s/p 2:06:30 } +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 881/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.401805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66143 samples/s/p 2:06:26 } +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 883/ 3125], loss: 0.295, per_step_time: 1425ms, lr: 6.398488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.61306 samples/s/p 2:07:29 } +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 885/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 6.3951707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.66136 samples/s/p 2:06:21 } +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 887/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.391853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65652 samples/s/p 2:06:24 } +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 889/ 3125], loss: 0.163, per_step_time: 1417ms, lr: 6.388534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.64524 samples/s/p 2:06:37 } +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 891/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 6.385215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65916 samples/s/p 2:06:15 } +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 893/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 6.3818943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65942 samples/s/p 2:06:12 } +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 895/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 6.378574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66163 samples/s/p 2:06:06 } +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 897/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 6.3752523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66121 samples/s/p 2:06:04 } +2024-07-30 04:02:26,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 899/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.371931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:26,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65905 samples/s/p 2:06:04 } +2024-07-30 04:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 901/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.3686084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:29,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66112 samples/s/p 2:05:58 } +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 903/ 3125], loss: 0.049, per_step_time: 1413ms, lr: 6.3652847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66097 samples/s/p 2:05:56 } +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 905/ 3125], loss: 0.419, per_step_time: 1412ms, lr: 6.36196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66185 samples/s/p 2:05:52 } +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 907/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.358636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:37,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.65873 samples/s/p 2:05:53 } +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 909/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 6.3553107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66102 samples/s/p 2:05:47 } +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 911/ 3125], loss: 0.361, per_step_time: 1412ms, lr: 6.3519847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66229 samples/s/p 2:05:43 } +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 913/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 6.3486586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66140 samples/s/p 2:05:41 } +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 915/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.345331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:48,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66054 samples/s/p 2:05:39 } +2024-07-30 04:02:51,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 917/ 3125], loss: 0.467, per_step_time: 1412ms, lr: 6.342003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:51,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66206 samples/s/p 2:05:35 } +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 919/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 6.338674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65725 samples/s/p 2:05:38 } +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 921/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.3353455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:57,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66079 samples/s/p 2:05:31 } +2024-07-30 04:03:00,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 923/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.332016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:00,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66153 samples/s/p 2:05:27 } +2024-07-30 04:03:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 925/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 6.3286852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:03,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66110 samples/s/p 2:05:25 } +2024-07-30 04:03:05,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 927/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 6.3253538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:05,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65954 samples/s/p 2:05:24 } +2024-07-30 04:03:08,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 929/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 6.3220227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:08,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65531 samples/s/p 2:05:27 } +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 931/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 6.318691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65751 samples/s/p 2:05:21 } +2024-07-30 04:03:14,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 933/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 6.315357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:14,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65837 samples/s/p 2:05:17 } +2024-07-30 04:03:17,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 935/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 6.3120237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:17,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65504 samples/s/p 2:05:18 } +2024-07-30 04:03:20,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 937/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 6.308689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:20,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65992 samples/s/p 2:05:09 } +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 939/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 6.305355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.66171 samples/s/p 2:05:04 } +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 941/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 6.3020193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.66303 samples/s/p 2:04:59 } +2024-07-30 04:03:28,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 943/ 3125], loss: 0.153, per_step_time: 1419ms, lr: 6.2986833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:28,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.63473 samples/s/p 2:05:34 } +2024-07-30 04:03:31,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 945/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 6.2953472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:31,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.65716 samples/s/p 2:05:01 } +2024-07-30 04:03:34,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 947/ 3125], loss: 0.170, per_step_time: 1418ms, lr: 6.2920094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:34,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.64148 samples/s/p 2:05:20 } +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 949/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 6.2886706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:37,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66069 samples/s/p 2:04:51 } +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 951/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 6.2853323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66216 samples/s/p 2:04:46 } +2024-07-30 04:03:42,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 953/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 6.281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65836 samples/s/p 2:04:49 } +2024-07-30 04:03:45,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 955/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 6.2786535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:45,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66240 samples/s/p 2:04:40 } +2024-07-30 04:03:48,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 957/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 6.2753134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:48,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65740 samples/s/p 2:04:44 } +2024-07-30 04:03:51,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 959/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 6.2719723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:51,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65587 samples/s/p 2:04:43 } +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 961/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.2686304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:54,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66165 samples/s/p 2:04:33 } +2024-07-30 04:03:56,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 963/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.2652884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:56,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66125 samples/s/p 2:04:31 } +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 965/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 6.2619456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:59,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66165 samples/s/p 2:04:27 } +2024-07-30 04:04:02,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 967/ 3125], loss: 0.455, per_step_time: 1413ms, lr: 6.2586028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:02,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66115 samples/s/p 2:04:25 } +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 969/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.255258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:05,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66007 samples/s/p 2:04:24 } +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 971/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 6.2519143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:08,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66025 samples/s/p 2:04:21 } +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 973/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 6.2485683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65851 samples/s/p 2:04:20 } +2024-07-30 04:04:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 975/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.245223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:13,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66115 samples/s/p 2:04:14 } +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 977/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 6.2418762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66026 samples/s/p 2:04:12 } +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 979/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.2385297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66082 samples/s/p 2:04:09 } +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 981/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 6.2351824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65828 samples/s/p 2:04:09 } +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 983/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.2318336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65797 samples/s/p 2:04:07 } +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 985/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 6.228485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65549 samples/s/p 2:04:07 } +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 987/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 6.2251356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65782 samples/s/p 2:04:01 } +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 989/ 3125], loss: 0.135, per_step_time: 1418ms, lr: 6.221786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.63951 samples/s/p 2:04:23 } +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 991/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 6.218435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.66227 samples/s/p 2:03:50 } +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 993/ 3125], loss: 0.431, per_step_time: 1415ms, lr: 6.215085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65103 samples/s/p 2:04:02 } +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 995/ 3125], loss: 0.215, per_step_time: 1417ms, lr: 6.2117324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:42,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.64299 samples/s/p 2:04:09 } +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 997/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.2083805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:45,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.66120 samples/s/p 2:03:43 } +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 999/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 6.205027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.65867 samples/s/p 2:03:43 } +2024-07-30 04:04:50,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1001/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.2016743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:50,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.66057 samples/s/p 2:03:38 } +2024-07-30 04:04:53,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1003/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.19832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65890 samples/s/p 2:03:37 } +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1005/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 6.194966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:56,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66186 samples/s/p 2:03:30 } +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1007/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 6.19161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65838 samples/s/p 2:03:32 } +2024-07-30 04:05:02,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 6.1882547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:02,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66162 samples/s/p 2:03:25 } +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1011/ 3125], loss: 0.428, per_step_time: 1418ms, lr: 6.1848987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:05,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.63863 samples/s/p 2:03:53 } +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1013/ 3125], loss: 0.426, per_step_time: 1417ms, lr: 6.1815417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:07,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.64350 samples/s/p 2:03:43 } +2024-07-30 04:05:10,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1015/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.178185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:10,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66095 samples/s/p 2:03:18 } +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1017/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 6.174826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:13,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65860 samples/s/p 2:03:18 } +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1019/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.1714672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65781 samples/s/p 2:03:16 } +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1021/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 6.1681085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66109 samples/s/p 2:03:09 } +2024-07-30 04:05:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1023/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.1647493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:22,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66038 samples/s/p 2:03:07 } +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1025/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.161389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:24,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65381 samples/s/p 2:03:13 } +2024-07-30 04:05:27,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1027/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 6.158028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:27,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65728 samples/s/p 2:03:05 } +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1029/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 6.1546666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65911 samples/s/p 2:03:00 } +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1031/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 6.1513047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65891 samples/s/p 2:02:58 } +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1033/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 6.147943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.65982 samples/s/p 2:02:54 } +2024-07-30 04:05:39,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1035/ 3125], loss: 0.040, per_step_time: 1412ms, lr: 6.1445794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:39,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66218 samples/s/p 2:02:48 } +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1037/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.1412165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:41,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.65985 samples/s/p 2:02:48 } +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1039/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 6.137852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66252 samples/s/p 2:02:42 } +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1041/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.134487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66147 samples/s/p 2:02:40 } +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1043/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.131122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66083 samples/s/p 2:02:38 } +2024-07-30 04:05:53,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1045/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.1277565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66045 samples/s/p 2:02:36 } +2024-07-30 04:05:56,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1047/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 6.124391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:56,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66003 samples/s/p 2:02:34 } +2024-07-30 04:05:58,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1049/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 6.121024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:58,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65743 samples/s/p 2:02:34 } +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1051/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.117656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65840 samples/s/p 2:02:30 } +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1053/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.114288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.65839 samples/s/p 2:02:27 } +2024-07-30 04:06:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1055/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 6.1109204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:07,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66023 samples/s/p 2:02:22 } +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1057/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.107551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66030 samples/s/p 2:02:19 } +2024-07-30 04:06:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1059/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 6.1041824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66225 samples/s/p 2:02:14 } +2024-07-30 04:06:15,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1061/ 3125], loss: 0.301, per_step_time: 1412ms, lr: 6.100812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:15,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66188 samples/s/p 2:02:11 } +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1063/ 3125], loss: 0.454, per_step_time: 1412ms, lr: 6.097441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66198 samples/s/p 2:02:08 } +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1065/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.0940706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65973 samples/s/p 2:02:08 } +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1067/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 6.090699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66124 samples/s/p 2:02:04 } +2024-07-30 04:06:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1069/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 6.0873276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65995 samples/s/p 2:02:03 } +2024-07-30 04:06:30,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1071/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 6.083955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:30,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66185 samples/s/p 2:01:57 } +2024-07-30 04:06:32,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1073/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 6.0805814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:32,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65949 samples/s/p 2:01:57 } +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1075/ 3125], loss: 0.729, per_step_time: 1413ms, lr: 6.0772086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65976 samples/s/p 2:01:54 } +2024-07-30 04:06:35,720 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:07:10,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1077/ 3125], loss: 0.403, per_step_time: 2378ms, lr: 6.0738334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:10,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 3.36354 samples/s/p 3:25:03 } +2024-07-30 04:07:13,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1079/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.070459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:13,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66007 samples/s/p 2:01:48 } +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1081/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 6.0670845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65995 samples/s/p 2:01:46 } +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1083/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 6.0637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:18,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65785 samples/s/p 2:01:45 } +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1085/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.060332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.66011 samples/s/p 2:01:40 } +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1087/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 6.056956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65817 samples/s/p 2:01:39 } +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1089/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 6.0535785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65873 samples/s/p 2:01:36 } +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1091/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.0502007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:30,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65948 samples/s/p 2:01:32 } +2024-07-30 04:07:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1093/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.0468233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.66130 samples/s/p 2:01:27 } +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1095/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 6.043444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65063 samples/s/p 2:01:38 } +2024-07-30 04:07:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1097/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 6.0400653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65703 samples/s/p 2:01:27 } +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1099/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 6.0366856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66188 samples/s/p 2:01:18 } +2024-07-30 04:07:44,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1101/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.0333055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:44,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65991 samples/s/p 2:01:17 } +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1103/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.0299253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66158 samples/s/p 2:01:12 } +2024-07-30 04:07:50,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1105/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.026544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:50,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65853 samples/s/p 2:01:13 } +2024-07-30 04:07:52,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1107/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 6.023162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:52,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65886 samples/s/p 2:01:10 } +2024-07-30 04:07:55,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1109/ 3125], loss: 0.299, per_step_time: 1412ms, lr: 6.01978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:55,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66191 samples/s/p 2:01:03 } +2024-07-30 04:07:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1111/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.016398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:58,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65988 samples/s/p 2:01:03 } +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1113/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 6.013014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:01,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65803 samples/s/p 2:01:03 } +2024-07-30 04:08:04,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1115/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 6.009631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66178 samples/s/p 2:00:55 } +2024-07-30 04:08:07,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1117/ 3125], loss: 0.078, per_step_time: 1415ms, lr: 6.0062466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:07,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65248 samples/s/p 2:01:04 } +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1119/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 6.0028624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:09,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66124 samples/s/p 2:00:50 } +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1121/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 5.9994773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66077 samples/s/p 2:00:48 } +2024-07-30 04:08:15,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1123/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 5.9960917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:15,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65491 samples/s/p 2:00:53 } +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1125/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 5.992706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65954 samples/s/p 2:00:44 } +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1127/ 3125], loss: 0.462, per_step_time: 1414ms, lr: 5.9893196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65767 samples/s/p 2:00:43 } +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1129/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 5.985932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65755 samples/s/p 2:00:41 } +2024-07-30 04:08:26,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1131/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.9825456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:26,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66024 samples/s/p 2:00:35 } +2024-07-30 04:08:29,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1133/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 5.9791573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:29,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65308 samples/s/p 2:00:41 } +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1135/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 5.975769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:32,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66104 samples/s/p 2:00:28 } +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1137/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.9723807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66039 samples/s/p 2:00:26 } +2024-07-30 04:08:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1139/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 5.968991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66228 samples/s/p 2:00:21 } +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1141/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 5.9656018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:41,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66228 samples/s/p 2:00:18 } +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1143/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 5.962211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66044 samples/s/p 2:00:17 } +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1145/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 5.958821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66139 samples/s/p 2:00:13 } +2024-07-30 04:08:49,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1147/ 3125], loss: 0.402, per_step_time: 1416ms, lr: 5.95543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.64881 samples/s/p 2:00:27 } +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1149/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.952038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:52,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.65976 samples/s/p 2:00:10 } +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1151/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 5.948646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:55,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.65954 samples/s/p 2:00:07 } +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1153/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.9452536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66066 samples/s/p 2:00:03 } +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1155/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 5.941861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:00,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66238 samples/s/p 1:59:58 } +2024-07-30 04:09:03,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1157/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.9384674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:03,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66089 samples/s/p 1:59:57 } +2024-07-30 04:09:06,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1159/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.935074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65946 samples/s/p 1:59:56 } +2024-07-30 04:09:09,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1161/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 5.9316794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65298 samples/s/p 2:00:01 } +2024-07-30 04:09:12,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1163/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 5.9282843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:12,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65810 samples/s/p 1:59:52 } +2024-07-30 04:09:15,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1165/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.92489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:15,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65772 samples/s/p 1:59:50 } +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1167/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 5.921494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:17,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65900 samples/s/p 1:59:45 } +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1169/ 3125], loss: 0.143, per_step_time: 1414ms, lr: 5.9180984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65439 samples/s/p 1:59:48 } +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1171/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.914702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65999 samples/s/p 1:59:38 } +2024-07-30 04:09:26,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1173/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 5.911305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:26,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65615 samples/s/p 1:59:40 } +2024-07-30 04:09:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1175/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9079075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:29,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66030 samples/s/p 1:59:32 } +2024-07-30 04:09:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1177/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 5.90451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65747 samples/s/p 1:59:33 } +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1179/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 5.9011118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66023 samples/s/p 1:59:27 } +2024-07-30 04:09:37,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1181/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 5.897713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:37,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66107 samples/s/p 1:59:23 } +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1183/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 5.8943137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65263 samples/s/p 1:59:31 } +2024-07-30 04:09:43,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1185/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.890914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:43,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65645 samples/s/p 1:59:23 } +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1187/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 5.887515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65480 samples/s/p 1:59:22 } +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1189/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 5.884114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65514 samples/s/p 1:59:19 } +2024-07-30 04:09:51,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1191/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 5.880714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65691 samples/s/p 1:59:14 } +2024-07-30 04:09:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1193/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.877312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.65919 samples/s/p 1:59:08 } +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1195/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.8739106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66144 samples/s/p 1:59:03 } +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1197/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 5.870509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:00,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66234 samples/s/p 1:58:59 } +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1199/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 5.867106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:03,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66145 samples/s/p 1:58:57 } +2024-07-30 04:10:06,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1201/ 3125], loss: 0.223, per_step_time: 1412ms, lr: 5.863704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:06,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66196 samples/s/p 1:58:53 } +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1203/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.8603005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66045 samples/s/p 1:58:52 } +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1205/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 5.8568967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:11,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66151 samples/s/p 1:58:48 } +2024-07-30 04:10:14,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1207/ 3125], loss: 0.055, per_step_time: 1440ms, lr: 5.8534924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:14,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.55176 samples/s/p 2:01:06 } +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1209/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.8500887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66049 samples/s/p 1:58:44 } +2024-07-30 04:10:20,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1211/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.846684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66080 samples/s/p 1:58:41 } +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1213/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.843279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65959 samples/s/p 1:58:39 } +2024-07-30 04:10:26,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1215/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.8398728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66012 samples/s/p 1:58:36 } +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1217/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.8364662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:28,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65975 samples/s/p 1:58:34 } +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1219/ 3125], loss: 0.381, per_step_time: 1412ms, lr: 5.83306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66192 samples/s/p 1:58:28 } +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1221/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.829653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66017 samples/s/p 1:58:27 } +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1223/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 5.826246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66010 samples/s/p 1:58:25 } +2024-07-30 04:10:40,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1225/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 5.8228384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:40,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66018 samples/s/p 1:58:22 } +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1227/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 5.81943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65969 samples/s/p 1:58:20 } +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1229/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 5.8160213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:45,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65497 samples/s/p 1:58:23 } +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1231/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 5.8126125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:48,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.66026 samples/s/p 1:58:13 } +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1233/ 3125], loss: 0.504, per_step_time: 1414ms, lr: 5.8092037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65560 samples/s/p 1:58:16 } +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1235/ 3125], loss: 0.378, per_step_time: 1415ms, lr: 5.805794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.64997 samples/s/p 1:58:20 } +2024-07-30 04:10:57,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1237/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 5.8023843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:57,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65427 samples/s/p 1:58:12 } +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1239/ 3125], loss: 0.475, per_step_time: 1413ms, lr: 5.7989732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.66091 samples/s/p 1:58:01 } +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1241/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 5.7955635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66158 samples/s/p 1:57:57 } +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1243/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.7921516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66142 samples/s/p 1:57:55 } +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1245/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.7887405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:08,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66084 samples/s/p 1:57:53 } +2024-07-30 04:11:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1247/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.7853285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66138 samples/s/p 1:57:49 } +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1249/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 5.781916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66098 samples/s/p 1:57:47 } +2024-07-30 04:11:17,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1251/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7785032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:17,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66054 samples/s/p 1:57:45 } +2024-07-30 04:11:19,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1253/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 5.7750904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:19,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65638 samples/s/p 1:57:47 } +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1255/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.7716775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65376 samples/s/p 1:57:47 } +2024-07-30 04:11:25,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1257/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 5.7682632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:25,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65916 samples/s/p 1:57:38 } +2024-07-30 04:11:28,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1259/ 3125], loss: 0.243, per_step_time: 1415ms, lr: 5.7648494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:28,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65286 samples/s/p 1:57:43 } +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1261/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 5.7614347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.66071 samples/s/p 1:57:30 } +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1263/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.75802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65994 samples/s/p 1:57:28 } +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1265/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.754605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.66081 samples/s/p 1:57:24 } +2024-07-30 04:11:39,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1267/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.7511893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65817 samples/s/p 1:57:25 } +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1269/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.7477737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66042 samples/s/p 1:57:19 } +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1271/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.7443576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65515 samples/s/p 1:57:23 } +2024-07-30 04:11:48,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1273/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.7409397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:48,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66044 samples/s/p 1:57:14 } +2024-07-30 04:11:51,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1275/ 3125], loss: 0.160, per_step_time: 1412ms, lr: 5.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:51,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66205 samples/s/p 1:57:09 } +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1277/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 5.7341063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66004 samples/s/p 1:57:08 } +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1279/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.7306884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65938 samples/s/p 1:57:06 } +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1281/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.7272705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65560 samples/s/p 1:57:08 } +2024-07-30 04:12:02,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1283/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.723852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:02,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65906 samples/s/p 1:57:01 } +2024-07-30 04:12:05,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1285/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7204334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:05,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66120 samples/s/p 1:56:56 } +2024-07-30 04:12:08,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1287/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 5.717014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:08,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65577 samples/s/p 1:57:00 } +2024-07-30 04:12:10,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1289/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 5.713595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:10,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65938 samples/s/p 1:56:52 } +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1291/ 3125], loss: 0.583, per_step_time: 1416ms, lr: 5.7101756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.64667 samples/s/p 1:57:05 } +2024-07-30 04:12:16,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1293/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 5.7067546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:16,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65582 samples/s/p 1:56:51 } +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1295/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 5.703335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66136 samples/s/p 1:56:41 } +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1297/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 5.6999133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66086 samples/s/p 1:56:39 } +2024-07-30 04:12:25,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1299/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 5.6964927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:25,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66148 samples/s/p 1:56:36 } +2024-07-30 04:12:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1301/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 5.6930708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:27,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66158 samples/s/p 1:56:33 } +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1303/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 5.6896492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:30,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.65385 samples/s/p 1:56:39 } +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1305/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 5.6862277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65825 samples/s/p 1:56:31 } +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1307/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.682805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65956 samples/s/p 1:56:27 } +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1309/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 5.679382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66175 samples/s/p 1:56:21 } +2024-07-30 04:12:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1311/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.675959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66042 samples/s/p 1:56:20 } +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1313/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.6725357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66022 samples/s/p 1:56:17 } +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1315/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.669112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:47,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66120 samples/s/p 1:56:13 } +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1317/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.665688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:50,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66092 samples/s/p 1:56:11 } +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1319/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.6622634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:53,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66066 samples/s/p 1:56:08 } +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1321/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 5.658839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66133 samples/s/p 1:56:05 } +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1323/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 5.6554136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65826 samples/s/p 1:56:06 } +2024-07-30 04:13:01,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1325/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 5.651989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:01,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65788 samples/s/p 1:56:03 } +2024-07-30 04:13:04,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1327/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 5.6485633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:04,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.66125 samples/s/p 1:55:56 } +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1329/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.645137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65894 samples/s/p 1:55:56 } +2024-07-30 04:13:10,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1331/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 5.6417107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:10,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65138 samples/s/p 1:56:03 } +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1333/ 3125], loss: 0.272, per_step_time: 1415ms, lr: 5.6382846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:13,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65361 samples/s/p 1:55:57 } +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1335/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.6348576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65877 samples/s/p 1:55:48 } +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1337/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.63143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66056 samples/s/p 1:55:43 } +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1339/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 5.6280032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66150 samples/s/p 1:55:39 } +2024-07-30 04:13:24,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1341/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 5.624575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66051 samples/s/p 1:55:37 } +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1343/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 5.621147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65717 samples/s/p 1:55:39 } +2024-07-30 04:13:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1345/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 5.6177187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:30,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65655 samples/s/p 1:55:37 } +2024-07-30 04:13:33,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1347/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.61429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:33,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65591 samples/s/p 1:55:35 } +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1349/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 5.6108615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:35,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65767 samples/s/p 1:55:30 } +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1351/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 5.607432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65907 samples/s/p 1:55:25 } +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1353/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.604002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:41,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65857 samples/s/p 1:55:23 } +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1355/ 3125], loss: 0.400, per_step_time: 1412ms, lr: 5.600573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.66230 samples/s/p 1:55:15 } +2024-07-30 04:13:47,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1357/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.597143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65980 samples/s/p 1:55:16 } +2024-07-30 04:13:50,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1359/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 5.593712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:50,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65401 samples/s/p 1:55:20 } +2024-07-30 04:13:52,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1361/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.590282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66117 samples/s/p 1:55:08 } +2024-07-30 04:13:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1363/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.5868504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:55,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65908 samples/s/p 1:55:08 } +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1365/ 3125], loss: 0.329, per_step_time: 1414ms, lr: 5.583419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65519 samples/s/p 1:55:10 } +2024-07-30 04:14:01,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1367/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.579988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:01,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66077 samples/s/p 1:55:00 } +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1369/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 5.5765563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66125 samples/s/p 1:54:57 } +2024-07-30 04:14:07,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1371/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 5.5731243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:07,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.66182 samples/s/p 1:54:53 } +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1373/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 5.5696914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.65919 samples/s/p 1:54:54 } +2024-07-30 04:14:12,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1375/ 3125], loss: 0.419, per_step_time: 1412ms, lr: 5.566259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66183 samples/s/p 1:54:48 } +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1377/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 5.562826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:15,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66001 samples/s/p 1:54:47 } +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1379/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.5593937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:18,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.65822 samples/s/p 1:54:46 } +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1381/ 3125], loss: 0.175, per_step_time: 1412ms, lr: 5.55596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.66194 samples/s/p 1:54:39 } +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1383/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.5525265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65783 samples/s/p 1:54:41 } +2024-07-30 04:14:26,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1385/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.5490923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:26,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65795 samples/s/p 1:54:38 } +2024-07-30 04:14:29,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1387/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 5.5456576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:29,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65986 samples/s/p 1:54:33 } +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1389/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.5422233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65990 samples/s/p 1:54:30 } +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1391/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 5.538789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65952 samples/s/p 1:54:28 } +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1393/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 5.5353544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65706 samples/s/p 1:54:28 } +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1395/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.5319188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65865 samples/s/p 1:54:23 } +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1397/ 3125], loss: 0.091, per_step_time: 1414ms, lr: 5.5284827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65738 samples/s/p 1:54:22 } +2024-07-30 04:14:46,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1399/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.5250475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:46,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65869 samples/s/p 1:54:18 } +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1401/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.521611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65824 samples/s/p 1:54:15 } +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1403/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.5181754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65993 samples/s/p 1:54:10 } +2024-07-30 04:14:55,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1405/ 3125], loss: 0.088, per_step_time: 1413ms, lr: 5.514739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:55,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.66015 samples/s/p 1:54:07 } +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1407/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.5113014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65741 samples/s/p 1:54:08 } +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1409/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 5.507865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:00,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65867 samples/s/p 1:54:04 } +2024-07-30 04:15:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1411/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.5044275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66103 samples/s/p 1:53:58 } +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1413/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 5.5009905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66057 samples/s/p 1:53:56 } +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1415/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 5.497553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:09,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65685 samples/s/p 1:53:57 } +2024-07-30 04:15:12,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1417/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 5.4941147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:12,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66104 samples/s/p 1:53:49 } +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1419/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.490676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.66125 samples/s/p 1:53:46 } +2024-07-30 04:15:17,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1421/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 5.487238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65903 samples/s/p 1:53:46 } +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1423/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 5.483799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65798 samples/s/p 1:53:45 } +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1425/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.480361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:23,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65911 samples/s/p 1:53:40 } +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1427/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.4769216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:26,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66073 samples/s/p 1:53:36 } +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1429/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 5.4734824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65846 samples/s/p 1:53:35 } +2024-07-30 04:15:32,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1431/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.470042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:32,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66026 samples/s/p 1:53:30 } +2024-07-30 04:15:34,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1433/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.466603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:34,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66100 samples/s/p 1:53:27 } +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1435/ 3125], loss: 0.118, per_step_time: 1412ms, lr: 5.4631632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66279 samples/s/p 1:53:22 } +2024-07-30 04:15:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1437/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 5.4597226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66191 samples/s/p 1:53:20 } +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1439/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 5.4562825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:43,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66175 samples/s/p 1:53:17 } +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1441/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4528414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:46,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66156 samples/s/p 1:53:15 } +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1443/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 5.449401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65867 samples/s/p 1:53:15 } +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1445/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 5.4459592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65153 samples/s/p 1:53:21 } +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1447/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 5.4425186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65810 samples/s/p 1:53:10 } +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1449/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4390775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65946 samples/s/p 1:53:06 } +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1451/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.435635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:00,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65961 samples/s/p 1:53:03 } +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1453/ 3125], loss: 0.465, per_step_time: 1415ms, lr: 5.432193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65217 samples/s/p 1:53:09 } +2024-07-30 04:16:06,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1455/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.428751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:06,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66040 samples/s/p 1:52:56 } +2024-07-30 04:16:09,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1457/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 5.4253087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:09,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65711 samples/s/p 1:52:58 } +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1459/ 3125], loss: 0.303, per_step_time: 1412ms, lr: 5.4218663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:11,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66215 samples/s/p 1:52:49 } +2024-07-30 04:16:14,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1461/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 5.418424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:14,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66086 samples/s/p 1:52:47 } +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1463/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.4149805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:17,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65842 samples/s/p 1:52:47 } +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1465/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 5.4115376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:20,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66167 samples/s/p 1:52:41 } +2024-07-30 04:16:23,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1467/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.408094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:23,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66118 samples/s/p 1:52:39 } +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1469/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.4046504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65695 samples/s/p 1:52:41 } +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1471/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.401207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65376 samples/s/p 1:52:42 } +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1473/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 5.3977633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65882 samples/s/p 1:52:33 } +2024-07-30 04:16:34,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1475/ 3125], loss: 0.199, per_step_time: 1412ms, lr: 5.3943186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:34,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.66258 samples/s/p 1:52:26 } +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1477/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 5.390875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:37,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65977 samples/s/p 1:52:26 } +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1479/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.38743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65856 samples/s/p 1:52:25 } +2024-07-30 04:16:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1481/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.3839854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:43,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65861 samples/s/p 1:52:22 } +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1483/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 5.380541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65876 samples/s/p 1:52:19 } +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1485/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.377095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65770 samples/s/p 1:52:17 } +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1487/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 5.3736508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66159 samples/s/p 1:52:10 } +2024-07-30 04:16:54,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1489/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.3702047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:54,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66048 samples/s/p 1:52:08 } +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1491/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 5.366759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66267 samples/s/p 1:52:03 } +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1493/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.363314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66075 samples/s/p 1:52:02 } +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1495/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.359868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65987 samples/s/p 1:52:01 } +2024-07-30 04:17:05,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1497/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.3564213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:05,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65930 samples/s/p 1:51:58 } +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1499/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.3529757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66157 samples/s/p 1:51:53 } +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1501/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 5.349529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66171 samples/s/p 1:51:50 } +2024-07-30 04:17:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1503/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 5.346082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66102 samples/s/p 1:51:48 } +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1505/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.342636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66116 samples/s/p 1:51:45 } +2024-07-30 04:17:19,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1507/ 3125], loss: 0.189, per_step_time: 1415ms, lr: 5.3391886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:19,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65168 samples/s/p 1:51:53 } +2024-07-30 04:17:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1509/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 5.3357408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65658 samples/s/p 1:51:45 } +2024-07-30 04:17:25,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1511/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.3322938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:25,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65972 samples/s/p 1:51:38 } +2024-07-30 04:17:28,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1513/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.3288472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:28,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65727 samples/s/p 1:51:38 } +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1515/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.3253993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65891 samples/s/p 1:51:33 } +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1517/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.321952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65974 samples/s/p 1:51:30 } +2024-07-30 04:17:36,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1519/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 5.318504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:36,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.66230 samples/s/p 1:51:24 } +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1521/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.3150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66109 samples/s/p 1:51:22 } +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1523/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.311608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66159 samples/s/p 1:51:19 } +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1525/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 5.3081594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66101 samples/s/p 1:51:17 } +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1527/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.3047115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66030 samples/s/p 1:51:15 } +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1529/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 5.301262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66094 samples/s/p 1:51:11 } +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1531/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 5.2978135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66155 samples/s/p 1:51:08 } +2024-07-30 04:17:56,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1533/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 5.2943647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:56,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65859 samples/s/p 1:51:08 } +2024-07-30 04:17:59,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1535/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 5.290916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:59,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65994 samples/s/p 1:51:04 } +2024-07-30 04:18:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1537/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 5.287467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65750 samples/s/p 1:51:04 } +2024-07-30 04:18:05,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1539/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.2840173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:05,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65947 samples/s/p 1:50:59 } +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1541/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.280567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66244 samples/s/p 1:50:52 } +2024-07-30 04:18:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1543/ 3125], loss: 0.397, per_step_time: 1414ms, lr: 5.277118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.65462 samples/s/p 1:50:59 } +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1545/ 3125], loss: 0.230, per_step_time: 1412ms, lr: 5.2736686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66192 samples/s/p 1:50:47 } +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1547/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 5.270219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66166 samples/s/p 1:50:45 } +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1549/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 5.2667688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65752 samples/s/p 1:50:47 } +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1551/ 3125], loss: 0.416, per_step_time: 1414ms, lr: 5.263318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:22,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65462 samples/s/p 1:50:48 } +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1553/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 5.259868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65819 samples/s/p 1:50:40 } +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1555/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.256418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:27,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65573 samples/s/p 1:50:41 } +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1557/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.252967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:30,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.66143 samples/s/p 1:50:31 } +2024-07-30 04:18:33,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1559/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.2495175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:33,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65916 samples/s/p 1:50:31 } +2024-07-30 04:18:36,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1561/ 3125], loss: 0.121, per_step_time: 1414ms, lr: 5.2460664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:36,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65753 samples/s/p 1:50:30 } +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1563/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 5.2426153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65512 samples/s/p 1:50:30 } +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1565/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 5.2391642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65808 samples/s/p 1:50:24 } +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1567/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.235713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.66081 samples/s/p 1:50:18 } +2024-07-30 04:18:47,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1569/ 3125], loss: 0.161, per_step_time: 1415ms, lr: 5.232262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:47,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65294 samples/s/p 1:50:24 } +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1571/ 3125], loss: 0.227, per_step_time: 1412ms, lr: 5.2288115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66309 samples/s/p 1:50:09 } +2024-07-30 04:18:53,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1573/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.225359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:53,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65949 samples/s/p 1:50:11 } +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1575/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 5.2219075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66140 samples/s/p 1:50:06 } +2024-07-30 04:18:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1577/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.2184564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65839 samples/s/p 1:50:06 } +2024-07-30 04:19:01,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1579/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.2150044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:01,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65904 samples/s/p 1:50:03 } +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1581/ 3125], loss: 0.413, per_step_time: 1416ms, lr: 5.2115533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:04,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.64863 samples/s/p 1:50:12 } +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1583/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 5.2081014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66278 samples/s/p 1:49:53 } +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1585/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.204649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65977 samples/s/p 1:49:53 } +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1587/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.2011965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.65942 samples/s/p 1:49:51 } +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1589/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 5.197744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.64714 samples/s/p 1:50:02 } +2024-07-30 04:19:18,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1591/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.1942925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:18,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66056 samples/s/p 1:49:44 } +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1593/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 5.19084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66076 samples/s/p 1:49:41 } +2024-07-30 04:19:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1595/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 5.187388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66157 samples/s/p 1:49:37 } +2024-07-30 04:19:27,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1597/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 5.1839343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65866 samples/s/p 1:49:38 } +2024-07-30 04:19:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1599/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 5.1804823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66198 samples/s/p 1:49:31 } +2024-07-30 04:19:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1601/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 5.17703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65958 samples/s/p 1:49:31 } +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1603/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 5.1735765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65616 samples/s/p 1:49:32 } +2024-07-30 04:19:38,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1605/ 3125], loss: 0.489, per_step_time: 1412ms, lr: 5.170124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:38,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.66215 samples/s/p 1:49:22 } +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1607/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.166671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65847 samples/s/p 1:49:24 } +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1609/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 5.163218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65558 samples/s/p 1:49:24 } +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1611/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 5.159764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:47,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65714 samples/s/p 1:49:20 } +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1613/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 5.156311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:50,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65632 samples/s/p 1:49:18 } +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1615/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 5.152858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65839 samples/s/p 1:49:13 } +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1617/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 5.149405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66136 samples/s/p 1:49:06 } +2024-07-30 04:19:58,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1619/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.1459515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:58,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66074 samples/s/p 1:49:04 } +2024-07-30 04:20:01,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1621/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 5.1424972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:01,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66066 samples/s/p 1:49:01 } +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1623/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 5.1390443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66022 samples/s/p 1:48:59 } +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1625/ 3125], loss: 0.078, per_step_time: 1417ms, lr: 5.1355905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:07,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.64338 samples/s/p 1:49:16 } +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1627/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 5.1321367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65583 samples/s/p 1:48:59 } +2024-07-30 04:20:12,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1629/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 5.1286834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65894 samples/s/p 1:48:52 } +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1631/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.125229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65987 samples/s/p 1:48:48 } +2024-07-30 04:20:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1633/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 5.1217744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66091 samples/s/p 1:48:44 } +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1635/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.118321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:21,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65799 samples/s/p 1:48:45 } +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1637/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 5.1148677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:24,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65949 samples/s/p 1:48:40 } +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1639/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.111413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66084 samples/s/p 1:48:36 } +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1641/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 5.107959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65896 samples/s/p 1:48:35 } +2024-07-30 04:20:32,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1643/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.104505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:32,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66103 samples/s/p 1:48:30 } +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1645/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 5.1010506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66051 samples/s/p 1:48:28 } +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1647/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.097596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:38,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66046 samples/s/p 1:48:25 } +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1649/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 5.0941417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66220 samples/s/p 1:48:20 } +2024-07-30 04:20:43,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1651/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.090688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:43,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66157 samples/s/p 1:48:18 } +2024-07-30 04:20:46,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1653/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.087233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66012 samples/s/p 1:48:17 } +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1655/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 5.0837784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66028 samples/s/p 1:48:14 } +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1657/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.080324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:52,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65961 samples/s/p 1:48:12 } +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1659/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.0768704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66108 samples/s/p 1:48:07 } +2024-07-30 04:20:58,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1661/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.0734147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:58,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65999 samples/s/p 1:48:06 } +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1663/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.069961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65902 samples/s/p 1:48:04 } +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1665/ 3125], loss: 0.072, per_step_time: 1413ms, lr: 5.0665058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:03,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65851 samples/s/p 1:48:02 } +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1667/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 5.0630515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:06,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65987 samples/s/p 1:47:57 } +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1669/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 5.0595963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:09,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65859 samples/s/p 1:47:56 } +2024-07-30 04:21:12,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1671/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 5.056142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:12,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65764 samples/s/p 1:47:54 } +2024-07-30 04:21:15,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1673/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 5.0526874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:15,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65115 samples/s/p 1:47:59 } +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1675/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 5.049232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65913 samples/s/p 1:47:47 } +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1677/ 3125], loss: 0.251, per_step_time: 1415ms, lr: 5.0457775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65313 samples/s/p 1:47:51 } +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1679/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 5.0423228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:23,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.66127 samples/s/p 1:47:39 } +2024-07-30 04:21:26,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1681/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 5.038868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:26,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66120 samples/s/p 1:47:36 } +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1683/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 5.035413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66020 samples/s/p 1:47:34 } +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1685/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.031958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:32,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65945 samples/s/p 1:47:32 } +2024-07-30 04:21:34,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1687/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.028503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:34,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65882 samples/s/p 1:47:30 } +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1689/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 5.0250483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65707 samples/s/p 1:47:29 } +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1691/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 5.0215936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66273 samples/s/p 1:47:20 } +2024-07-30 04:21:43,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1693/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.018139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66090 samples/s/p 1:47:19 } +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1695/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 5.014684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65431 samples/s/p 1:47:24 } +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1697/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 5.011229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65971 samples/s/p 1:47:15 } +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1699/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 5.0077733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65993 samples/s/p 1:47:12 } +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1701/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 5.0043186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66264 samples/s/p 1:47:06 } +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1703/ 3125], loss: 0.478, per_step_time: 1413ms, lr: 5.0008643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65959 samples/s/p 1:47:07 } +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1705/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.997409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66002 samples/s/p 1:47:04 } +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1707/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.993954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66128 samples/s/p 1:46:59 } +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1709/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 4.9904984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65726 samples/s/p 1:47:01 } +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1711/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 4.987043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66295 samples/s/p 1:46:52 } +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1713/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 4.9835885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66040 samples/s/p 1:46:52 } +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1715/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 4.980134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66318 samples/s/p 1:46:46 } +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1717/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.9766795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:17,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65852 samples/s/p 1:46:48 } +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1719/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 4.9732243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.66062 samples/s/p 1:46:43 } +2024-07-30 04:22:23,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1721/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 4.9697696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:23,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.66060 samples/s/p 1:46:40 } +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1723/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 4.9663136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65454 samples/s/p 1:46:44 } +2024-07-30 04:22:28,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1725/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 4.962859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:28,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65832 samples/s/p 1:46:37 } +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1727/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 4.9594046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66154 samples/s/p 1:46:31 } +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1729/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 4.95595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66101 samples/s/p 1:46:28 } +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1731/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.952495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65777 samples/s/p 1:46:29 } +2024-07-30 04:22:40,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1733/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 4.9490404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:40,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65986 samples/s/p 1:46:24 } +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1735/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 4.9455857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65711 samples/s/p 1:46:24 } +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1737/ 3125], loss: 0.193, per_step_time: 1415ms, lr: 4.9421305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65174 samples/s/p 1:46:28 } +2024-07-30 04:22:48,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1739/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.938676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:48,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66022 samples/s/p 1:46:15 } +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1741/ 3125], loss: 0.430, per_step_time: 1412ms, lr: 4.935221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66267 samples/s/p 1:46:10 } +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1743/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 4.9317664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66115 samples/s/p 1:46:09 } +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1745/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 4.928312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66206 samples/s/p 1:46:05 } +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1747/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 4.924858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.66134 samples/s/p 1:46:03 } +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1749/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.9214036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.65947 samples/s/p 1:46:02 } +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1751/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.917948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.66152 samples/s/p 1:45:57 } +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1753/ 3125], loss: 0.163, per_step_time: 1414ms, lr: 4.9144937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.65732 samples/s/p 1:45:59 } +2024-07-30 04:23:11,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1755/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.911039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:11,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65862 samples/s/p 1:45:54 } +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1757/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 4.9075848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65419 samples/s/p 1:45:57 } +2024-07-30 04:23:16,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1759/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.904131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:16,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66229 samples/s/p 1:45:45 } +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1761/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 4.9006767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:19,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65859 samples/s/p 1:45:46 } +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1763/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.8972224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66159 samples/s/p 1:45:40 } +2024-07-30 04:23:25,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1765/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.8937677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66226 samples/s/p 1:45:36 } +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1767/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 4.8903134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66090 samples/s/p 1:45:35 } +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1769/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.8868596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:31,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65691 samples/s/p 1:45:37 } +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1771/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 4.883406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65933 samples/s/p 1:45:31 } +2024-07-30 04:23:36,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1773/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.879952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:36,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66032 samples/s/p 1:45:27 } +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1775/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 4.8764978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66113 samples/s/p 1:45:23 } +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1777/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.873044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:42,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66042 samples/s/p 1:45:21 } +2024-07-30 04:23:45,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1779/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 4.8695906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:45,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66120 samples/s/p 1:45:18 } +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1781/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 4.866136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.65891 samples/s/p 1:45:17 } +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1783/ 3125], loss: 0.181, per_step_time: 1412ms, lr: 4.8626825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66331 samples/s/p 1:45:10 } +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1785/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 4.859229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66086 samples/s/p 1:45:09 } +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1787/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 4.855775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66015 samples/s/p 1:45:07 } +2024-07-30 04:23:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1789/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 4.852322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:59,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65642 samples/s/p 1:45:09 } +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1791/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.8488687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:02,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65783 samples/s/p 1:45:04 } +2024-07-30 04:24:05,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1793/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 4.845416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:05,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65652 samples/s/p 1:45:03 } +2024-07-30 04:24:07,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1795/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 4.8419615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:07,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65809 samples/s/p 1:44:58 } +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1797/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.8385086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65856 samples/s/p 1:44:55 } +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1799/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 4.8350553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.66226 samples/s/p 1:44:48 } +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1801/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 4.8316024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65166 samples/s/p 1:44:57 } +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1803/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.82815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66091 samples/s/p 1:44:44 } +2024-07-30 04:24:22,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1805/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 4.824697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:22,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66298 samples/s/p 1:44:39 } +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1807/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 4.821244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66009 samples/s/p 1:44:39 } +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1809/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 4.8177913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66153 samples/s/p 1:44:35 } +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1811/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 4.814338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66158 samples/s/p 1:44:32 } +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1813/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.810886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65900 samples/s/p 1:44:32 } +2024-07-30 04:24:36,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1815/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.8074335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:36,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66076 samples/s/p 1:44:27 } +2024-07-30 04:24:39,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1817/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 4.8039815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65992 samples/s/p 1:44:25 } +2024-07-30 04:24:42,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1819/ 3125], loss: 0.369, per_step_time: 1412ms, lr: 4.800529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66226 samples/s/p 1:44:20 } +2024-07-30 04:24:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1821/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 4.797077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66128 samples/s/p 1:44:18 } +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1823/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.793624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65912 samples/s/p 1:44:18 } +2024-07-30 04:24:50,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1825/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.7901726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:50,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66054 samples/s/p 1:44:13 } +2024-07-30 04:24:53,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1827/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 4.7867206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:53,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66020 samples/s/p 1:44:11 } +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1829/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 4.7832696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66067 samples/s/p 1:44:08 } +2024-07-30 04:24:59,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1831/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 4.779817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:59,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.65965 samples/s/p 1:44:06 } +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1833/ 3125], loss: 0.329, per_step_time: 1412ms, lr: 4.776366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66230 samples/s/p 1:44:00 } +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1835/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.772915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66016 samples/s/p 1:44:00 } +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1837/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 4.769464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:07,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.65840 samples/s/p 1:43:59 } +2024-07-30 04:25:10,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1839/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.766012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66158 samples/s/p 1:43:52 } +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1841/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 4.762561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65963 samples/s/p 1:43:52 } +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1843/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 4.7591093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65390 samples/s/p 1:43:55 } +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1845/ 3125], loss: 0.663, per_step_time: 1414ms, lr: 4.755659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:18,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65389 samples/s/p 1:43:52 } +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1847/ 3125], loss: 0.470, per_step_time: 1413ms, lr: 4.7522085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.66047 samples/s/p 1:43:42 } +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1849/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 4.748758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65668 samples/s/p 1:43:44 } +2024-07-30 04:25:27,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1851/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7453073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:27,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66158 samples/s/p 1:43:35 } +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1853/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 4.741856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65832 samples/s/p 1:43:36 } +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1855/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 4.738406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66163 samples/s/p 1:43:30 } +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1857/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.734956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66104 samples/s/p 1:43:28 } +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1859/ 3125], loss: 0.089, per_step_time: 1415ms, lr: 4.731506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65360 samples/s/p 1:43:33 } +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1861/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 4.728057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:41,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65711 samples/s/p 1:43:26 } +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1863/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 4.7246062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.66039 samples/s/p 1:43:20 } +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1865/ 3125], loss: 0.362, per_step_time: 1414ms, lr: 4.721157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:47,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65686 samples/s/p 1:43:21 } +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1867/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.717707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.66009 samples/s/p 1:43:14 } +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1869/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 4.7142576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66169 samples/s/p 1:43:10 } +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1871/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.7108088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66032 samples/s/p 1:43:09 } +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1873/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 4.70736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:58,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66068 samples/s/p 1:43:05 } +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1875/ 3125], loss: 0.180, per_step_time: 1412ms, lr: 4.7039107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66329 samples/s/p 1:43:00 } +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1877/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.700462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66039 samples/s/p 1:43:00 } +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1879/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.6970135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:07,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65961 samples/s/p 1:42:58 } +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1881/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.6935643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:09,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65932 samples/s/p 1:42:56 } +2024-07-30 04:26:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1883/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 4.690116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:12,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66059 samples/s/p 1:42:51 } +2024-07-30 04:26:15,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1885/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 4.686668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:15,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66311 samples/s/p 1:42:46 } +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1887/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 4.6832197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65948 samples/s/p 1:42:47 } +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1889/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.679772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:21,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65847 samples/s/p 1:42:45 } +2024-07-30 04:26:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1891/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.6763244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65882 samples/s/p 1:42:42 } +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1893/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 4.672877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65672 samples/s/p 1:42:41 } +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1895/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.6694286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.66172 samples/s/p 1:42:33 } +2024-07-30 04:26:32,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1897/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 4.6659816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:32,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66037 samples/s/p 1:42:32 } +2024-07-30 04:26:35,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1899/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 4.662534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:35,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.65984 samples/s/p 1:42:30 } +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1901/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.659087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66175 samples/s/p 1:42:25 } +2024-07-30 04:26:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1903/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.655641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66075 samples/s/p 1:42:23 } +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1905/ 3125], loss: 0.525, per_step_time: 1413ms, lr: 4.652194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66126 samples/s/p 1:42:19 } +2024-07-30 04:26:46,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1907/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 4.648748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66054 samples/s/p 1:42:17 } +2024-07-30 04:26:49,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1909/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 4.6453015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:49,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.65930 samples/s/p 1:42:16 } +2024-07-30 04:26:52,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1911/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 4.6418545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66241 samples/s/p 1:42:10 } +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1913/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.6384084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66051 samples/s/p 1:42:09 } +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1915/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.6349633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66063 samples/s/p 1:42:06 } +2024-07-30 04:27:00,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1917/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.6315176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:00,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66100 samples/s/p 1:42:03 } +2024-07-30 04:27:03,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1919/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.6280725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65980 samples/s/p 1:42:01 } +2024-07-30 04:27:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1921/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 4.624627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65832 samples/s/p 1:42:00 } +2024-07-30 04:27:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1923/ 3125], loss: 0.213, per_step_time: 1415ms, lr: 4.621182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:09,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65359 samples/s/p 1:42:02 } +2024-07-30 04:27:12,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1925/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 4.617736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:12,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65837 samples/s/p 1:41:54 } +2024-07-30 04:27:15,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1927/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.614292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:15,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65725 samples/s/p 1:41:53 } +2024-07-30 04:27:17,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1929/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.6108476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:17,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.66034 samples/s/p 1:41:47 } +2024-07-30 04:27:20,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1931/ 3125], loss: 0.541, per_step_time: 1412ms, lr: 4.6074033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.66227 samples/s/p 1:41:42 } +2024-07-30 04:27:23,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1933/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.603959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:23,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65893 samples/s/p 1:41:42 } +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1935/ 3125], loss: 0.469, per_step_time: 1413ms, lr: 4.6005152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65845 samples/s/p 1:41:40 } +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1937/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.5970714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65996 samples/s/p 1:41:36 } +2024-07-30 04:27:32,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1939/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.593627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:32,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.66052 samples/s/p 1:41:32 } +2024-07-30 04:27:34,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1941/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.590184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:34,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.66067 samples/s/p 1:41:29 } +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1943/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.586741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:37,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65968 samples/s/p 1:41:27 } +2024-07-30 04:27:40,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1945/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 4.5832976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:40,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65504 samples/s/p 1:41:30 } +2024-07-30 04:27:43,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1947/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 4.579855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:43,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.66034 samples/s/p 1:41:21 } +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1949/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.5764127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65778 samples/s/p 1:41:21 } +2024-07-30 04:27:49,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1951/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 4.5729703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:49,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65701 samples/s/p 1:41:19 } +2024-07-30 04:27:51,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1953/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.5695274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65925 samples/s/p 1:41:14 } +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1955/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.5660854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65827 samples/s/p 1:41:12 } +2024-07-30 04:27:57,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1957/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.5626434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:57,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66040 samples/s/p 1:41:07 } +2024-07-30 04:28:00,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1959/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 4.559202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:00,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65994 samples/s/p 1:41:05 } +2024-07-30 04:28:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1961/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 4.555761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:03,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66108 samples/s/p 1:41:01 } +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1963/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 4.55232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66030 samples/s/p 1:40:59 } +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1965/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 4.5488787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66142 samples/s/p 1:40:55 } +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1967/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 4.5454376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66139 samples/s/p 1:40:52 } +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1969/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.5419965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.65953 samples/s/p 1:40:51 } +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1971/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 4.538557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65967 samples/s/p 1:40:48 } +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1973/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 4.535117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66063 samples/s/p 1:40:44 } +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1975/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 4.5316774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65802 samples/s/p 1:40:44 } +2024-07-30 04:28:25,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1977/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 4.5282372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66015 samples/s/p 1:40:39 } +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1979/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.5247984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65469 samples/s/p 1:40:42 } +2024-07-30 04:28:31,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1981/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 4.521359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:31,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66229 samples/s/p 1:40:31 } +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1983/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 4.5179195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66087 samples/s/p 1:40:30 } +2024-07-30 04:28:37,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1985/ 3125], loss: 0.598, per_step_time: 1413ms, lr: 4.5144807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:37,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.65888 samples/s/p 1:40:29 } +2024-07-30 04:28:40,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1987/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.511043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:40,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66142 samples/s/p 1:40:23 } +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1989/ 3125], loss: 0.072, per_step_time: 1412ms, lr: 4.507604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66327 samples/s/p 1:40:19 } +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1991/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 4.504166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66320 samples/s/p 1:40:16 } +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1993/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.5007287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:48,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65674 samples/s/p 1:40:20 } +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1995/ 3125], loss: 0.250, per_step_time: 1412ms, lr: 4.4972912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66201 samples/s/p 1:40:12 } +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1997/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 4.493853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65721 samples/s/p 1:40:14 } +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1999/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 4.4904164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65870 samples/s/p 1:40:09 } +2024-07-30 04:28:59,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2001/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 4.486979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:59,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65924 samples/s/p 1:40:06 } +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2003/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 4.483543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66103 samples/s/p 1:40:01 } +2024-07-30 04:29:05,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2005/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 4.480107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:05,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66022 samples/s/p 1:39:59 } +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2007/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 4.4766707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66013 samples/s/p 1:39:57 } +2024-07-30 04:29:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2009/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.4732346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:11,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66045 samples/s/p 1:39:53 } +2024-07-30 04:29:14,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2011/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 4.4697986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65919 samples/s/p 1:39:52 } +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2013/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 4.466363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:16,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65699 samples/s/p 1:39:51 } +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2015/ 3125], loss: 0.189, per_step_time: 1412ms, lr: 4.4629282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66196 samples/s/p 1:39:43 } +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2017/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.4594935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65935 samples/s/p 1:39:43 } +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2019/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.4560597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65785 samples/s/p 1:39:42 } +2024-07-30 04:29:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2021/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 4.4526246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:28,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65450 samples/s/p 1:39:43 } +2024-07-30 04:29:31,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2023/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.449191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:31,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65773 samples/s/p 1:39:36 } +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2025/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 4.445756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65483 samples/s/p 1:39:37 } +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2027/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.442323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65923 samples/s/p 1:39:29 } +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2029/ 3125], loss: 0.114, per_step_time: 1425ms, lr: 4.4388903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.61392 samples/s/p 1:40:15 } +2024-07-30 04:29:42,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2031/ 3125], loss: 0.126, per_step_time: 1415ms, lr: 4.435457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:42,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65276 samples/s/p 1:39:30 } +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2033/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 4.432024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66223 samples/s/p 1:39:18 } +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2035/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 4.428592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66203 samples/s/p 1:39:15 } +2024-07-30 04:29:50,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2037/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.42516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:50,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66078 samples/s/p 1:39:13 } +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2039/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 4.4217286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66031 samples/s/p 1:39:11 } +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2041/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.4182957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66141 samples/s/p 1:39:07 } +2024-07-30 04:29:59,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2043/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 4.414865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.65823 samples/s/p 1:39:08 } +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2045/ 3125], loss: 0.360, per_step_time: 1412ms, lr: 4.4114336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66241 samples/s/p 1:39:00 } +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2047/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 4.408003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.65966 samples/s/p 1:39:00 } +2024-07-30 04:30:08,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2049/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.404573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66019 samples/s/p 1:38:57 } +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2051/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.4011426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66111 samples/s/p 1:38:53 } +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2053/ 3125], loss: 0.081, per_step_time: 1413ms, lr: 4.3977125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66112 samples/s/p 1:38:50 } +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2055/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.3942828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.66103 samples/s/p 1:38:48 } +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2057/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.390853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65969 samples/s/p 1:38:46 } +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2059/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 4.387424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.66029 samples/s/p 1:38:43 } +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2061/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 4.3839955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65889 samples/s/p 1:38:42 } +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2063/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 4.380567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:27,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65657 samples/s/p 1:38:41 } +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2065/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 4.377139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:30,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66086 samples/s/p 1:38:34 } +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2067/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 4.3737114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:33,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65950 samples/s/p 1:38:32 } +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2069/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 4.3702826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66193 samples/s/p 1:38:27 } +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2071/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.3668556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66135 samples/s/p 1:38:25 } +2024-07-30 04:30:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2073/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 4.3634286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65867 samples/s/p 1:38:25 } +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2075/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 4.3600025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.66037 samples/s/p 1:38:20 } +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2077/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.3565756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65281 samples/s/p 1:38:25 } +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2079/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 4.35315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65508 samples/s/p 1:38:20 } +2024-07-30 04:30:53,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2081/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 4.3497243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:53,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65674 samples/s/p 1:38:15 } +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2083/ 3125], loss: 0.231, per_step_time: 1416ms, lr: 4.346298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:56,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.64719 samples/s/p 1:38:23 } +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2085/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 4.342873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.65993 samples/s/p 1:38:06 } +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2087/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.339449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66148 samples/s/p 1:38:02 } +2024-07-30 04:31:04,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2089/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 4.3360237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:04,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66206 samples/s/p 1:37:59 } +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2091/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 4.3326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66170 samples/s/p 1:37:56 } +2024-07-30 04:31:10,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2093/ 3125], loss: 0.243, per_step_time: 1412ms, lr: 4.329176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:10,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66181 samples/s/p 1:37:53 } +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2095/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 4.3257533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:13,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66190 samples/s/p 1:37:50 } +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2097/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 4.3223286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66213 samples/s/p 1:37:47 } +2024-07-30 04:31:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2099/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.318906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:18,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66056 samples/s/p 1:37:46 } +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2101/ 3125], loss: 0.409, per_step_time: 1412ms, lr: 4.3154832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66291 samples/s/p 1:37:41 } +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2103/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 4.3120613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:24,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66049 samples/s/p 1:37:40 } +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2105/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.3086397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66048 samples/s/p 1:37:38 } +2024-07-30 04:31:30,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2107/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.305218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:30,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66067 samples/s/p 1:37:35 } +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2109/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.3017967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65836 samples/s/p 1:37:34 } +2024-07-30 04:31:35,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2111/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 4.298376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:35,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66116 samples/s/p 1:37:28 } +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2113/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 4.2949546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:38,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65709 samples/s/p 1:37:30 } +2024-07-30 04:31:41,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2115/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 4.2915344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66157 samples/s/p 1:37:22 } +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2117/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.2881147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65859 samples/s/p 1:37:23 } +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2119/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 4.2846955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66087 samples/s/p 1:37:17 } +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2121/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 4.281276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:50,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.66081 samples/s/p 1:37:15 } +2024-07-30 04:31:52,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2123/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 4.2778574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:52,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.65962 samples/s/p 1:37:13 } +2024-07-30 04:31:55,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2125/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 4.274439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:55,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65730 samples/s/p 1:37:13 } +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2127/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.27102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.66044 samples/s/p 1:37:07 } +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2129/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.2676024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:01,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65900 samples/s/p 1:37:05 } +2024-07-30 04:32:04,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2131/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 4.264185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66079 samples/s/p 1:37:01 } +2024-07-30 04:32:07,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2133/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 4.2607676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:07,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66021 samples/s/p 1:36:58 } +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2135/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 4.257351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66284 samples/s/p 1:36:53 } +2024-07-30 04:32:12,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2137/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 4.253935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:12,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65766 samples/s/p 1:36:55 } +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2139/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 4.250519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65331 samples/s/p 1:36:57 } +2024-07-30 04:32:18,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2141/ 3125], loss: 0.498, per_step_time: 1413ms, lr: 4.2471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:18,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.66052 samples/s/p 1:36:47 } +2024-07-30 04:32:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2143/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 4.2436873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65797 samples/s/p 1:36:47 } +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2145/ 3125], loss: 0.457, per_step_time: 1414ms, lr: 4.240272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65673 samples/s/p 1:36:45 } +2024-07-30 04:32:26,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2147/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.2368574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:26,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65615 samples/s/p 1:36:43 } +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2149/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.2334436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.66080 samples/s/p 1:36:35 } +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2151/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 4.23003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65575 samples/s/p 1:36:37 } +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2153/ 3125], loss: 0.188, per_step_time: 1414ms, lr: 4.226616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65741 samples/s/p 1:36:33 } +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2155/ 3125], loss: 0.256, per_step_time: 1418ms, lr: 4.2232023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.63884 samples/s/p 1:36:49 } +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2157/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 4.2197894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65557 samples/s/p 1:36:29 } +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2159/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.216377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:43,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65925 samples/s/p 1:36:23 } +2024-07-30 04:32:46,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2161/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 4.2129655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:46,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65974 samples/s/p 1:36:19 } +2024-07-30 04:32:49,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2163/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 4.209554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65761 samples/s/p 1:36:19 } +2024-07-30 04:32:52,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2165/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 4.2061424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:52,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66176 samples/s/p 1:36:12 } +2024-07-30 04:32:55,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2167/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 4.2027314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65500 samples/s/p 1:36:16 } +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2169/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 4.19932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66116 samples/s/p 1:36:07 } +2024-07-30 04:33:00,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2171/ 3125], loss: 0.269, per_step_time: 1412ms, lr: 4.19591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:00,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66210 samples/s/p 1:36:03 } +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2173/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 4.1925005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66013 samples/s/p 1:36:02 } +2024-07-30 04:33:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2175/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.1890917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66019 samples/s/p 1:35:59 } +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2177/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 4.185682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66196 samples/s/p 1:35:54 } +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2179/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 4.1822736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66199 samples/s/p 1:35:52 } +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2181/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 4.1788658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.65988 samples/s/p 1:35:51 } +2024-07-30 04:33:17,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2183/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.1754583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66020 samples/s/p 1:35:48 } +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2185/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.1720496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66099 samples/s/p 1:35:44 } +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2187/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.168643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65840 samples/s/p 1:35:44 } +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2189/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.165236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:26,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65939 samples/s/p 1:35:40 } +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2191/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.16183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.66140 samples/s/p 1:35:35 } +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2193/ 3125], loss: 0.481, per_step_time: 1413ms, lr: 4.1584244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65947 samples/s/p 1:35:34 } +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2195/ 3125], loss: 0.492, per_step_time: 1414ms, lr: 4.1550193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65596 samples/s/p 1:35:35 } +2024-07-30 04:33:37,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2197/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 4.1516146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:37,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65223 samples/s/p 1:35:36 } +2024-07-30 04:33:40,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2199/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 4.148209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:40,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65830 samples/s/p 1:35:27 } +2024-07-30 04:33:43,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2201/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.1448043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:43,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65897 samples/s/p 1:35:24 } +2024-07-30 04:33:46,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2203/ 3125], loss: 0.338, per_step_time: 1412ms, lr: 4.141401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:46,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.66179 samples/s/p 1:35:18 } +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2205/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.1379976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66018 samples/s/p 1:35:17 } +2024-07-30 04:33:51,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2207/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.1345947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:51,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66140 samples/s/p 1:35:13 } +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2209/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 4.131192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:54,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66118 samples/s/p 1:35:10 } +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2211/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 4.12779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66285 samples/s/p 1:35:05 } +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2213/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.1243875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66081 samples/s/p 1:35:05 } +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2215/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 4.1209864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66309 samples/s/p 1:35:00 } +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2217/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 4.117586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66046 samples/s/p 1:34:59 } +2024-07-30 04:34:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2219/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 4.1141857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66032 samples/s/p 1:34:57 } +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2221/ 3125], loss: 0.216, per_step_time: 1412ms, lr: 4.110785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66219 samples/s/p 1:34:52 } +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2223/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 4.1073854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.65814 samples/s/p 1:34:53 } +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2225/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 4.1039866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65773 samples/s/p 1:34:51 } +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2227/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 4.1005865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:20,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65476 samples/s/p 1:34:51 } +2024-07-30 04:34:23,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2229/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 4.0971886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:23,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65894 samples/s/p 1:34:44 } +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2231/ 3125], loss: 0.579, per_step_time: 1413ms, lr: 4.093791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.66139 samples/s/p 1:34:39 } +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2233/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 4.0903933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65702 samples/s/p 1:34:40 } +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2235/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.0869963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66174 samples/s/p 1:34:33 } +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2237/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.0836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65926 samples/s/p 1:34:32 } +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2239/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 4.080204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65419 samples/s/p 1:34:35 } +2024-07-30 04:34:40,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2241/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 4.0768073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66289 samples/s/p 1:34:23 } +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2243/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 4.073412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.66011 samples/s/p 1:34:23 } +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2245/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 4.070017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:45,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65997 samples/s/p 1:34:20 } +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2247/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 4.0666228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65650 samples/s/p 1:34:21 } +2024-07-30 04:34:51,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2249/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.063229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:51,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65820 samples/s/p 1:34:16 } +2024-07-30 04:34:54,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2251/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 4.0598356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65811 samples/s/p 1:34:14 } +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2253/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 4.056443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.66069 samples/s/p 1:34:08 } +2024-07-30 04:34:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2255/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.0530504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65831 samples/s/p 1:34:08 } +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2257/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 4.049657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65663 samples/s/p 1:34:07 } +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2259/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 4.0462655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65417 samples/s/p 1:34:06 } +2024-07-30 04:35:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2261/ 3125], loss: 0.310, per_step_time: 1412ms, lr: 4.0428745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66191 samples/s/p 1:33:56 } +2024-07-30 04:35:11,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2263/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.039484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:11,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66000 samples/s/p 1:33:55 } +2024-07-30 04:35:14,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2265/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 4.0360937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:14,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66269 samples/s/p 1:33:49 } +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2267/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 4.0327036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65907 samples/s/p 1:33:50 } +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2269/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 4.0293144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:19,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65914 samples/s/p 1:33:47 } +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2271/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 4.025924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66360 samples/s/p 1:33:40 } +2024-07-30 04:35:25,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2273/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 4.0225364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:25,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66038 samples/s/p 1:33:40 } +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2275/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 4.019148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:28,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66209 samples/s/p 1:33:36 } +2024-07-30 04:35:31,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2277/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.015761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:31,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66041 samples/s/p 1:33:35 } +2024-07-30 04:35:33,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2279/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 4.0123737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:33,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66061 samples/s/p 1:33:32 } +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2281/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.008987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66253 samples/s/p 1:33:27 } +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2283/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 4.005601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:39,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65886 samples/s/p 1:33:28 } +2024-07-30 04:35:42,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2285/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 4.0022146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:42,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66157 samples/s/p 1:33:22 } +2024-07-30 04:35:45,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2287/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.9988295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:45,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66104 samples/s/p 1:33:20 } +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2289/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.9954452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:48,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66026 samples/s/p 1:33:18 } +2024-07-30 04:35:50,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2291/ 3125], loss: 0.377, per_step_time: 1412ms, lr: 3.9920606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.66292 samples/s/p 1:33:12 } +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2293/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.9886772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65681 samples/s/p 1:33:16 } +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2295/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.985294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65959 samples/s/p 1:33:10 } +2024-07-30 04:35:59,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2297/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 3.9819115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:59,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65764 samples/s/p 1:33:09 } +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2299/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 3.978528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65851 samples/s/p 1:33:05 } +2024-07-30 04:36:05,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2301/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.9751467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:05,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65840 samples/s/p 1:33:03 } +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2303/ 3125], loss: 0.450, per_step_time: 1414ms, lr: 3.9717647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65551 samples/s/p 1:33:03 } +2024-07-30 04:36:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2305/ 3125], loss: 0.127, per_step_time: 1414ms, lr: 3.9683846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:10,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65753 samples/s/p 1:32:58 } +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2307/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.9650045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.66043 samples/s/p 1:32:52 } +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2309/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 3.9616248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:16,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66133 samples/s/p 1:32:49 } +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2311/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 3.958245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66020 samples/s/p 1:32:47 } +2024-07-30 04:36:22,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2313/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 3.9548663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:22,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66050 samples/s/p 1:32:44 } +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2315/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 3.951487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66276 samples/s/p 1:32:39 } +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2317/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.9481097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:27,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66035 samples/s/p 1:32:38 } +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2319/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.9447323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66034 samples/s/p 1:32:35 } +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2321/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 3.9413558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66121 samples/s/p 1:32:32 } +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2323/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.9379793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66018 samples/s/p 1:32:30 } +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2325/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 3.9346037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:39,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66257 samples/s/p 1:32:25 } +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2327/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.9312285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:41,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65991 samples/s/p 1:32:24 } +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2329/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.9278525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:44,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66123 samples/s/p 1:32:20 } +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2331/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 3.9244787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66091 samples/s/p 1:32:18 } +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2333/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.921105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65939 samples/s/p 1:32:16 } +2024-07-30 04:36:53,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2335/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 3.9177316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:53,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65910 samples/s/p 1:32:14 } +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2337/ 3125], loss: 0.206, per_step_time: 1417ms, lr: 3.914359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.64367 samples/s/p 1:32:26 } +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2339/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 3.910987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65917 samples/s/p 1:32:08 } +2024-07-30 04:37:01,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2341/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.9076153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65830 samples/s/p 1:32:06 } +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2343/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.9042434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:04,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65821 samples/s/p 1:32:04 } +2024-07-30 04:37:07,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2345/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 3.900873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:07,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65981 samples/s/p 1:31:59 } +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2347/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 3.897502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65925 samples/s/p 1:31:57 } +2024-07-30 04:37:13,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2349/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 3.894133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.66265 samples/s/p 1:31:51 } +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2351/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 3.890764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65709 samples/s/p 1:31:53 } +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2353/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.887396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65963 samples/s/p 1:31:48 } +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2355/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 3.8840276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66371 samples/s/p 1:31:41 } +2024-07-30 04:37:24,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2357/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 3.8806597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:24,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65545 samples/s/p 1:31:46 } +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2359/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 3.8772923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66051 samples/s/p 1:31:39 } +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2361/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.873926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:30,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65709 samples/s/p 1:31:39 } +2024-07-30 04:37:32,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2363/ 3125], loss: 0.151, per_step_time: 1415ms, lr: 3.8705602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65335 samples/s/p 1:31:40 } +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2365/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.867195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:35,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65810 samples/s/p 1:31:33 } +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2367/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.86383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:38,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65962 samples/s/p 1:31:28 } +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2369/ 3125], loss: 0.330, per_step_time: 1415ms, lr: 3.8604658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65218 samples/s/p 1:31:33 } +2024-07-30 04:37:44,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2371/ 3125], loss: 0.040, per_step_time: 1414ms, lr: 3.8571015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:44,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65636 samples/s/p 1:31:26 } +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2373/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.8537382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:47,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.66132 samples/s/p 1:31:18 } +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2375/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.850376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.65918 samples/s/p 1:31:17 } +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2377/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.8470143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:52,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66008 samples/s/p 1:31:14 } +2024-07-30 04:37:55,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2379/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.8436524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:55,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66126 samples/s/p 1:31:10 } +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2381/ 3125], loss: 0.364, per_step_time: 1416ms, lr: 3.8402914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.64690 samples/s/p 1:31:21 } +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2383/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.8369312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:01,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65867 samples/s/p 1:31:07 } +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2385/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 3.8335716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:04,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65961 samples/s/p 1:31:03 } +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2387/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 3.8302114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66016 samples/s/p 1:30:59 } +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2389/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 3.826853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66236 samples/s/p 1:30:54 } +2024-07-30 04:38:12,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2391/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.8234944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:12,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66080 samples/s/p 1:30:53 } +2024-07-30 04:38:15,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2393/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.820137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:15,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65895 samples/s/p 1:30:52 } +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2395/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 3.81678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:18,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65930 samples/s/p 1:30:49 } +2024-07-30 04:38:21,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2397/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 3.8134237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:21,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66075 samples/s/p 1:30:45 } +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2399/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 3.8100677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65381 samples/s/p 1:30:49 } +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2401/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.806712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66062 samples/s/p 1:30:39 } +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2403/ 3125], loss: 0.595, per_step_time: 1413ms, lr: 3.8033568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65936 samples/s/p 1:30:38 } +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2405/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 3.8000028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:32,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65887 samples/s/p 1:30:35 } +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2407/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 3.7966493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65657 samples/s/p 1:30:35 } +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2409/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7932964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65752 samples/s/p 1:30:31 } +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2411/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.7899433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:41,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65843 samples/s/p 1:30:27 } +2024-07-30 04:38:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2413/ 3125], loss: 0.084, per_step_time: 1413ms, lr: 3.7865918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66091 samples/s/p 1:30:22 } +2024-07-30 04:38:46,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2415/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 3.7832397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:46,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66178 samples/s/p 1:30:18 } +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2417/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 3.7798889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66002 samples/s/p 1:30:17 } +2024-07-30 04:38:52,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2419/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.7765392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:52,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65886 samples/s/p 1:30:15 } +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2421/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7731897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:55,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66009 samples/s/p 1:30:11 } +2024-07-30 04:38:58,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2423/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 3.7698403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:58,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65896 samples/s/p 1:30:10 } +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2425/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.7664922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66071 samples/s/p 1:30:05 } +2024-07-30 04:39:03,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2427/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.7631446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:03,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65918 samples/s/p 1:30:04 } +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2429/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.7597963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66003 samples/s/p 1:30:00 } +2024-07-30 04:39:09,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2431/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.7564498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:09,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65915 samples/s/p 1:29:58 } +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2433/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.753104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65913 samples/s/p 1:29:55 } +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2435/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7497582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65972 samples/s/p 1:29:52 } +2024-07-30 04:39:17,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2437/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.7464135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:17,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65991 samples/s/p 1:29:49 } +2024-07-30 04:39:20,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2439/ 3125], loss: 0.328, per_step_time: 1415ms, lr: 3.7430698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:20,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65212 samples/s/p 1:29:54 } +2024-07-30 04:39:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2441/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.7397258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65913 samples/s/p 1:29:44 } +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2443/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.736382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.66009 samples/s/p 1:29:40 } +2024-07-30 04:39:29,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2445/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.73304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:29,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65680 samples/s/p 1:29:41 } +2024-07-30 04:39:32,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2447/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.7296977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:32,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65235 samples/s/p 1:29:42 } +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2449/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 3.7263565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65815 samples/s/p 1:29:34 } +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2451/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 3.7230163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65987 samples/s/p 1:29:29 } +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2453/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 3.7196764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65759 samples/s/p 1:29:29 } +2024-07-30 04:39:43,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2455/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 3.7163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:43,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66002 samples/s/p 1:29:23 } +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2457/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 3.712998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66041 samples/s/p 1:29:20 } +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2459/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.7096588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66202 samples/s/p 1:29:16 } +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2461/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.7063216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66091 samples/s/p 1:29:14 } +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2463/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 3.7029847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65986 samples/s/p 1:29:12 } +2024-07-30 04:39:57,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2465/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.6996487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:57,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66100 samples/s/p 1:29:08 } +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2467/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.6963124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:00,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65916 samples/s/p 1:29:07 } +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2469/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.6929775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:03,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66125 samples/s/p 1:29:02 } +2024-07-30 04:40:06,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2471/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 3.6896433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:06,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66078 samples/s/p 1:29:00 } +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2473/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.6863087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66017 samples/s/p 1:28:58 } +2024-07-30 04:40:11,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2475/ 3125], loss: 0.343, per_step_time: 1412ms, lr: 3.6829756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66260 samples/s/p 1:28:53 } +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2477/ 3125], loss: 0.064, per_step_time: 2882ms, lr: 3.6796432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:46,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 2.77583 samples/s/p 3:01:13 } +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2479/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.676311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65859 samples/s/p 1:28:51 } +2024-07-30 04:40:51,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2481/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 3.67298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:51,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66195 samples/s/p 1:28:45 } +2024-07-30 04:40:54,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2483/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 3.6696492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:54,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66085 samples/s/p 1:28:43 } +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2485/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6663198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.64989 samples/s/p 1:28:51 } +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2487/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.662989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65923 samples/s/p 1:28:39 } +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2489/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.6596607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.66160 samples/s/p 1:28:34 } +2024-07-30 04:41:06,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2491/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 3.6563322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65014 samples/s/p 1:28:42 } +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2493/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 3.6530046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65873 samples/s/p 1:28:31 } +2024-07-30 04:41:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2495/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 3.649678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:11,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65919 samples/s/p 1:28:28 } +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2497/ 3125], loss: 0.399, per_step_time: 1416ms, lr: 3.6463523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.64953 samples/s/p 1:28:34 } +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2499/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.6430263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65908 samples/s/p 1:28:22 } +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2501/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.639701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65970 samples/s/p 1:28:19 } +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2503/ 3125], loss: 0.176, per_step_time: 1414ms, lr: 3.6363765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:23,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65759 samples/s/p 1:28:18 } +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2505/ 3125], loss: 0.574, per_step_time: 1424ms, lr: 3.633053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:25,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.61630 samples/s/p 1:28:54 } +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2507/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6297301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65262 samples/s/p 1:28:17 } +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2509/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.6264082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:31,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65658 samples/s/p 1:28:10 } +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2511/ 3125], loss: 0.570, per_step_time: 1414ms, lr: 3.623086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65586 samples/s/p 1:28:08 } +2024-07-30 04:41:37,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2513/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.6197655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:37,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.66157 samples/s/p 1:28:00 } +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2515/ 3125], loss: 0.619, per_step_time: 1413ms, lr: 3.616444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65903 samples/s/p 1:28:00 } +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2517/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 3.6131246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65508 samples/s/p 1:28:00 } +2024-07-30 04:41:45,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2519/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 3.6098056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65625 samples/s/p 1:27:56 } +2024-07-30 04:41:48,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2521/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 3.6064878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:48,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.66052 samples/s/p 1:27:50 } +2024-07-30 04:41:51,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2523/ 3125], loss: 0.164, per_step_time: 1429ms, lr: 3.6031697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:51,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.59683 samples/s/p 1:28:47 } +2024-07-30 04:41:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2525/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.5998528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66150 samples/s/p 1:27:43 } +2024-07-30 04:41:57,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2527/ 3125], loss: 0.453, per_step_time: 1414ms, lr: 3.5965368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:57,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65564 samples/s/p 1:27:46 } +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2529/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.5932212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65830 samples/s/p 1:27:40 } +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2531/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 3.5899054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66029 samples/s/p 1:27:36 } +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2533/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 3.5865914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65542 samples/s/p 1:27:37 } +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2535/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.5832775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65944 samples/s/p 1:27:31 } +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2537/ 3125], loss: 0.054, per_step_time: 1414ms, lr: 3.5799646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65767 samples/s/p 1:27:30 } +2024-07-30 04:42:14,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2539/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.5766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:14,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65917 samples/s/p 1:27:25 } +2024-07-30 04:42:17,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2541/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.573341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:17,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65957 samples/s/p 1:27:22 } +2024-07-30 04:42:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2543/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.5700302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:19,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65976 samples/s/p 1:27:19 } +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2545/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 3.5667192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:22,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65616 samples/s/p 1:27:20 } +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2547/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 3.563409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65387 samples/s/p 1:27:19 } +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2549/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 3.5601004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:28,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65813 samples/s/p 1:27:12 } +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2551/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 3.5567923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.66213 samples/s/p 1:27:06 } +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2553/ 3125], loss: 0.078, per_step_time: 1414ms, lr: 3.5534852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:34,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65532 samples/s/p 1:27:09 } +2024-07-30 04:42:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2555/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 3.5501782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65530 samples/s/p 1:27:06 } +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2557/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.546872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:39,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65987 samples/s/p 1:26:59 } +2024-07-30 04:42:42,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2559/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 3.5435658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:42,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.66135 samples/s/p 1:26:55 } +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2561/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 3.5402613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66147 samples/s/p 1:26:52 } +2024-07-30 04:42:48,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2563/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.5369574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:48,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65968 samples/s/p 1:26:51 } +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2565/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.533654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:51,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65953 samples/s/p 1:26:48 } +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2567/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 3.5303517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66031 samples/s/p 1:26:45 } +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2569/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 3.5270493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66038 samples/s/p 1:26:42 } +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2571/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 3.5237483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66056 samples/s/p 1:26:39 } +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2573/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.5204469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65771 samples/s/p 1:26:39 } +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2575/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 3.5171472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65564 samples/s/p 1:26:38 } +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2577/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 3.5138485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66041 samples/s/p 1:26:31 } +2024-07-30 04:43:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2579/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 3.5105502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65929 samples/s/p 1:26:29 } +2024-07-30 04:43:13,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2581/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 3.5072524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:13,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.66060 samples/s/p 1:26:25 } +2024-07-30 04:43:16,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2583/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 3.5039554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65851 samples/s/p 1:26:24 } +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2585/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5006594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.66013 samples/s/p 1:26:20 } +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2587/ 3125], loss: 0.173, per_step_time: 1415ms, lr: 3.4973639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65308 samples/s/p 1:26:23 } +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2589/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4940683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:25,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65902 samples/s/p 1:26:15 } +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2591/ 3125], loss: 0.183, per_step_time: 1412ms, lr: 3.4907746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:27,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.66220 samples/s/p 1:26:09 } +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2593/ 3125], loss: 0.070, per_step_time: 1414ms, lr: 3.4874804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65551 samples/s/p 1:26:13 } +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2595/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 3.4841883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65765 samples/s/p 1:26:08 } +2024-07-30 04:43:36,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2597/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 3.4808963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:36,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65645 samples/s/p 1:26:06 } +2024-07-30 04:43:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2599/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 3.4776056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65598 samples/s/p 1:26:04 } +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2601/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4743143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:42,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65812 samples/s/p 1:25:59 } +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2603/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 3.4710242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.66006 samples/s/p 1:25:54 } +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2605/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.467735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65991 samples/s/p 1:25:52 } +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2607/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.4644468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65858 samples/s/p 1:25:50 } +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2609/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 3.4611594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:53,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65745 samples/s/p 1:25:48 } +2024-07-30 04:43:56,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2611/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4578727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:56,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66120 samples/s/p 1:25:42 } +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2613/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.4545865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65866 samples/s/p 1:25:41 } +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2615/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 3.4513014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66177 samples/s/p 1:25:36 } +2024-07-30 04:44:04,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2617/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 3.4480156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:04,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65821 samples/s/p 1:25:36 } +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2619/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 3.444732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65631 samples/s/p 1:25:35 } +2024-07-30 04:44:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2621/ 3125], loss: 0.879, per_step_time: 1413ms, lr: 3.4414493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65832 samples/s/p 1:25:30 } +2024-07-30 04:44:13,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2623/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 3.438167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:13,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65167 samples/s/p 1:25:34 } +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2625/ 3125], loss: 0.056, per_step_time: 1418ms, lr: 3.434885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:16,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.64032 samples/s/p 1:25:41 } +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2627/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.4316042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66041 samples/s/p 1:25:20 } +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2629/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 3.4283244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66201 samples/s/p 1:25:16 } +2024-07-30 04:44:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2631/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 3.4250438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66256 samples/s/p 1:25:12 } +2024-07-30 04:44:27,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2633/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 3.4217655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:27,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65119 samples/s/p 1:25:20 } +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2635/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.4184877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:30,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66228 samples/s/p 1:25:07 } +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2637/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 3.4152101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66027 samples/s/p 1:25:06 } +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2639/ 3125], loss: 0.533, per_step_time: 1413ms, lr: 3.4119344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65926 samples/s/p 1:25:04 } +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2641/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 3.4086588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65306 samples/s/p 1:25:07 } +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2643/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 3.405384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66009 samples/s/p 1:24:58 } +2024-07-30 04:44:44,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2645/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 3.402109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:44,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66328 samples/s/p 1:24:52 } +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2647/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 3.3988356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65995 samples/s/p 1:24:52 } +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2649/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3955628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.66011 samples/s/p 1:24:49 } +2024-07-30 04:44:52,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2651/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 3.3922913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.66015 samples/s/p 1:24:46 } +2024-07-30 04:44:55,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2653/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.3890205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65927 samples/s/p 1:24:44 } +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2655/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 3.3857502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65514 samples/s/p 1:24:45 } +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2657/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 3.3824806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65784 samples/s/p 1:24:40 } +2024-07-30 04:45:04,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2659/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.3792119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:04,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.66027 samples/s/p 1:24:35 } +2024-07-30 04:45:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2661/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.3759432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65962 samples/s/p 1:24:33 } +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2663/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.3726762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65848 samples/s/p 1:24:31 } +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2665/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 3.36941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65940 samples/s/p 1:24:27 } +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2667/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.3661445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:15,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65787 samples/s/p 1:24:26 } +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2669/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.3628792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65810 samples/s/p 1:24:23 } +2024-07-30 04:45:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2671/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 3.3596154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66055 samples/s/p 1:24:18 } +2024-07-30 04:45:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2673/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 3.3563524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66124 samples/s/p 1:24:14 } +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2675/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 3.353089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66137 samples/s/p 1:24:11 } +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2677/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.3498275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:29,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65850 samples/s/p 1:24:11 } +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2679/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.3465665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65960 samples/s/p 1:24:07 } +2024-07-30 04:45:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2681/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 3.3433062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65993 samples/s/p 1:24:04 } +2024-07-30 04:45:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2683/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 3.340047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65980 samples/s/p 1:24:01 } +2024-07-30 04:45:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2685/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 3.3367887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65341 samples/s/p 1:24:04 } +2024-07-30 04:45:43,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2687/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.333531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:43,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.66131 samples/s/p 1:23:54 } +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2689/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 3.3302733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:46,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66127 samples/s/p 1:23:52 } +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2691/ 3125], loss: 0.316, per_step_time: 1412ms, lr: 3.3270173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66238 samples/s/p 1:23:48 } +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2693/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3237618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65987 samples/s/p 1:23:47 } +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2695/ 3125], loss: 0.215, per_step_time: 1416ms, lr: 3.3205074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:55,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.64653 samples/s/p 1:23:56 } +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2697/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.3172535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.66107 samples/s/p 1:23:40 } +2024-07-30 04:46:00,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2699/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 3.3140009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.66069 samples/s/p 1:23:38 } +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2701/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.3107483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65920 samples/s/p 1:23:36 } +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2703/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 3.3074969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65760 samples/s/p 1:23:35 } +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2705/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 3.3042456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65902 samples/s/p 1:23:31 } +2024-07-30 04:46:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2707/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 3.3009962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.66054 samples/s/p 1:23:27 } +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2709/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 3.2977473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65400 samples/s/p 1:23:30 } +2024-07-30 04:46:17,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2711/ 3125], loss: 0.232, per_step_time: 1416ms, lr: 3.2944995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:17,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.64858 samples/s/p 1:23:32 } +2024-07-30 04:46:20,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2713/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 3.291252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:20,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65777 samples/s/p 1:23:21 } +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2715/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2880055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66057 samples/s/p 1:23:15 } +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2717/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 3.2847588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66164 samples/s/p 1:23:12 } +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2719/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.2815146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66038 samples/s/p 1:23:10 } +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2721/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 3.2782705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66144 samples/s/p 1:23:06 } +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2723/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 3.275028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:35,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65909 samples/s/p 1:23:05 } +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2725/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 3.2717846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66034 samples/s/p 1:23:02 } +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2727/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 3.2685434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66123 samples/s/p 1:22:58 } +2024-07-30 04:46:43,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2729/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 3.265303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:43,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65859 samples/s/p 1:22:57 } +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2731/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2620633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.66108 samples/s/p 1:22:52 } +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2733/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 3.2588234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65921 samples/s/p 1:22:51 } +2024-07-30 04:46:52,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2735/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.2555854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:52,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65839 samples/s/p 1:22:49 } +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2737/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 3.2523476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65632 samples/s/p 1:22:48 } +2024-07-30 04:46:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2739/ 3125], loss: 0.217, per_step_time: 1428ms, lr: 3.2491112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:57,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.60154 samples/s/p 1:23:34 } +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2741/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.2458759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:00,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65952 samples/s/p 1:22:40 } +2024-07-30 04:47:03,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2743/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 3.242641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:03,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65924 samples/s/p 1:22:37 } +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2745/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 3.2394066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66107 samples/s/p 1:22:33 } +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2747/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.236173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:09,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66053 samples/s/p 1:22:30 } +2024-07-30 04:47:11,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2749/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 3.2329403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66080 samples/s/p 1:22:27 } +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2751/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.2297091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66141 samples/s/p 1:22:24 } +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2753/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 3.2264786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66026 samples/s/p 1:22:22 } +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2755/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 3.2232485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:20,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65893 samples/s/p 1:22:20 } +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2757/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 3.2200196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66142 samples/s/p 1:22:15 } +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2759/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.2167916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65932 samples/s/p 1:22:14 } +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2761/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 3.2135636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:28,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65677 samples/s/p 1:22:14 } +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2763/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.2103371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:31,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65784 samples/s/p 1:22:10 } +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2765/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.2071118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:34,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65998 samples/s/p 1:22:05 } +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2767/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 3.2038872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:37,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.66042 samples/s/p 1:22:02 } +2024-07-30 04:47:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2769/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.200663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.66128 samples/s/p 1:21:59 } +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2771/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 3.1974405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65895 samples/s/p 1:21:58 } +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2773/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 3.1942182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65749 samples/s/p 1:21:56 } +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2775/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 3.190996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65805 samples/s/p 1:21:53 } +2024-07-30 04:47:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2777/ 3125], loss: 0.291, per_step_time: 1415ms, lr: 3.1877757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:51,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65255 samples/s/p 1:21:55 } +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2779/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 3.1845566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66089 samples/s/p 1:21:45 } +2024-07-30 04:47:57,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2781/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 3.1813377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:57,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65991 samples/s/p 1:21:43 } +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2783/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 3.1781199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:00,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66186 samples/s/p 1:21:38 } +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2785/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 3.1749032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66022 samples/s/p 1:21:37 } +2024-07-30 04:48:05,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2787/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.171687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:05,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66059 samples/s/p 1:21:34 } +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2789/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1684717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66049 samples/s/p 1:21:31 } +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2791/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 3.1652569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:11,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66096 samples/s/p 1:21:28 } +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2793/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.162043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:14,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65956 samples/s/p 1:21:26 } +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2795/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 3.1588309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:17,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65979 samples/s/p 1:21:23 } +2024-07-30 04:48:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2797/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.1556194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:19,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66107 samples/s/p 1:21:19 } +2024-07-30 04:48:22,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2799/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.152409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:22,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66166 samples/s/p 1:21:16 } +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2801/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.1491986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:25,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65935 samples/s/p 1:21:15 } +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2803/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 3.1459897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65741 samples/s/p 1:21:14 } +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2805/ 3125], loss: 0.419, per_step_time: 1412ms, lr: 3.1427805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66176 samples/s/p 1:21:07 } +2024-07-30 04:48:34,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2807/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.1395732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65860 samples/s/p 1:21:07 } +2024-07-30 04:48:36,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2809/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.136367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:36,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65631 samples/s/p 1:21:06 } +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2811/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.133162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66036 samples/s/p 1:21:00 } +2024-07-30 04:48:42,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2813/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.1299573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:42,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65886 samples/s/p 1:20:58 } +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2815/ 3125], loss: 0.597, per_step_time: 1413ms, lr: 3.1267534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65837 samples/s/p 1:20:56 } +2024-07-30 04:48:48,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2817/ 3125], loss: 0.322, per_step_time: 1415ms, lr: 3.1235509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:48,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65223 samples/s/p 1:20:58 } +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2819/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.1203479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:51,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65838 samples/s/p 1:20:50 } +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2821/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 3.1171471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.66202 samples/s/p 1:20:44 } +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2823/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1139475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65936 samples/s/p 1:20:44 } +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2825/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 3.110748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66174 samples/s/p 1:20:39 } +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2827/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 3.1075494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:02,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66097 samples/s/p 1:20:37 } +2024-07-30 04:49:05,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2829/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 3.1043523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66052 samples/s/p 1:20:34 } +2024-07-30 04:49:08,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2831/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 3.1011564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.65966 samples/s/p 1:20:32 } +2024-07-30 04:49:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2833/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.0979597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.65789 samples/s/p 1:20:31 } +2024-07-30 04:49:13,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2835/ 3125], loss: 0.214, per_step_time: 1418ms, lr: 3.094765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.63950 samples/s/p 1:20:44 } +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2837/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0915708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:16,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66146 samples/s/p 1:20:22 } +2024-07-30 04:49:19,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2839/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.0883782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:19,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66152 samples/s/p 1:20:19 } +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2841/ 3125], loss: 0.094, per_step_time: 1412ms, lr: 3.0851863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66230 samples/s/p 1:20:16 } +2024-07-30 04:49:25,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2843/ 3125], loss: 0.482, per_step_time: 1413ms, lr: 3.0819954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:25,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65910 samples/s/p 1:20:16 } +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2845/ 3125], loss: 0.384, per_step_time: 1415ms, lr: 3.0788058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65052 samples/s/p 1:20:20 } +2024-07-30 04:49:30,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2847/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.0756155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:30,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65917 samples/s/p 1:20:10 } +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2849/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 3.0724268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:33,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65935 samples/s/p 1:20:07 } +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2851/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0692397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65947 samples/s/p 1:20:04 } +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2853/ 3125], loss: 0.544, per_step_time: 1413ms, lr: 3.0660533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:39,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.65924 samples/s/p 1:20:02 } +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2855/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 3.062868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66192 samples/s/p 1:19:56 } +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2857/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 3.0596836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66020 samples/s/p 1:19:55 } +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2859/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.0564995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66134 samples/s/p 1:19:51 } +2024-07-30 04:49:50,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2861/ 3125], loss: 0.190, per_step_time: 1412ms, lr: 3.053317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:50,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66174 samples/s/p 1:19:48 } +2024-07-30 04:49:53,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2863/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.0501344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66069 samples/s/p 1:19:46 } +2024-07-30 04:49:56,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2865/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 3.0469537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:56,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66167 samples/s/p 1:19:43 } +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2867/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.0437736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66085 samples/s/p 1:19:40 } +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2869/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.040595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:01,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66127 samples/s/p 1:19:37 } +2024-07-30 04:50:04,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2871/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.0374165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:04,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65991 samples/s/p 1:19:36 } +2024-07-30 04:50:07,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2873/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 3.0342396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:07,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65609 samples/s/p 1:19:36 } +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2875/ 3125], loss: 0.374, per_step_time: 1415ms, lr: 3.0310637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:10,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65309 samples/s/p 1:19:36 } +2024-07-30 04:50:13,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2877/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.0278873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:13,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65709 samples/s/p 1:19:29 } +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2879/ 3125], loss: 0.043, per_step_time: 1419ms, lr: 3.0247134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.63440 samples/s/p 1:19:46 } +2024-07-30 04:50:18,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2881/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 3.02154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:18,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66061 samples/s/p 1:19:21 } +2024-07-30 04:50:21,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2883/ 3125], loss: 0.264, per_step_time: 1412ms, lr: 3.0183671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:21,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66192 samples/s/p 1:19:17 } +2024-07-30 04:50:24,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2885/ 3125], loss: 0.169, per_step_time: 1414ms, lr: 3.015196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:24,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.65691 samples/s/p 1:19:18 } +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2887/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 3.012026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66060 samples/s/p 1:19:12 } +2024-07-30 04:50:30,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2889/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 3.008856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:30,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66032 samples/s/p 1:19:10 } +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2891/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 3.0056867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66098 samples/s/p 1:19:06 } +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2893/ 3125], loss: 0.385, per_step_time: 1412ms, lr: 3.0025187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66174 samples/s/p 1:19:03 } +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2895/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.999352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65925 samples/s/p 1:19:02 } +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2897/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 2.9961866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65858 samples/s/p 1:19:00 } +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2899/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 2.9930218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66059 samples/s/p 1:18:55 } +2024-07-30 04:50:47,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2901/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.9898583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:47,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65937 samples/s/p 1:18:54 } +2024-07-30 04:50:50,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2903/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.9866949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:50,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66083 samples/s/p 1:18:50 } +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2905/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 2.9835319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66070 samples/s/p 1:18:47 } +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2907/ 3125], loss: 0.115, per_step_time: 1414ms, lr: 2.980371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65582 samples/s/p 1:18:48 } +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2909/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 2.9772114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:58,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65868 samples/s/p 1:18:43 } +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2911/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.9740524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66012 samples/s/p 1:18:39 } +2024-07-30 04:51:04,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2913/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.9708945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:04,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65963 samples/s/p 1:18:36 } +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2915/ 3125], loss: 0.250, per_step_time: 1412ms, lr: 2.9677371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66196 samples/s/p 1:18:32 } +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2917/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 2.9645812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:09,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65952 samples/s/p 1:18:31 } +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2919/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 2.961425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65421 samples/s/p 1:18:32 } +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2921/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.958271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65750 samples/s/p 1:18:27 } +2024-07-30 04:51:18,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2923/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.9551177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:18,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65827 samples/s/p 1:18:23 } +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2925/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9519658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.66237 samples/s/p 1:18:17 } +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2927/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.9488142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:24,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66114 samples/s/p 1:18:15 } +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2929/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.9456642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66170 samples/s/p 1:18:12 } +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2931/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 2.942515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66015 samples/s/p 1:18:11 } +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2933/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 2.9393668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65757 samples/s/p 1:18:10 } +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2935/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 2.9362188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65949 samples/s/p 1:18:05 } +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2937/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 2.9330724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65939 samples/s/p 1:18:03 } +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2939/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 2.9299267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66119 samples/s/p 1:17:58 } +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2941/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 2.9267826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65787 samples/s/p 1:17:58 } +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2943/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.9236394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65969 samples/s/p 1:17:54 } +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2945/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.920497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66116 samples/s/p 1:17:50 } +2024-07-30 04:51:52,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2947/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.917356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65884 samples/s/p 1:17:49 } +2024-07-30 04:51:55,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2949/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 2.9142147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:55,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65955 samples/s/p 1:17:46 } +2024-07-30 04:51:58,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2951/ 3125], loss: 0.022, per_step_time: 1413ms, lr: 2.9110752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:58,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66102 samples/s/p 1:17:42 } +2024-07-30 04:52:00,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2953/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 2.9079372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:00,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65898 samples/s/p 1:17:40 } +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2955/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 2.904799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66290 samples/s/p 1:17:34 } +2024-07-30 04:52:06,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2957/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.9016626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:06,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66019 samples/s/p 1:17:34 } +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2959/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 2.8985273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66004 samples/s/p 1:17:31 } +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2961/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.8953932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66146 samples/s/p 1:17:27 } +2024-07-30 04:52:15,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2963/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.8922586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.65987 samples/s/p 1:17:26 } +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2965/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.8891266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:17,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66057 samples/s/p 1:17:22 } +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2967/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.8859954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:20,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65785 samples/s/p 1:17:22 } +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2969/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.882865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:23,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66097 samples/s/p 1:17:16 } +2024-07-30 04:52:26,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2971/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 2.8797358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:26,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66058 samples/s/p 1:17:14 } +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2973/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 2.8766076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:29,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65670 samples/s/p 1:17:14 } +2024-07-30 04:52:32,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2975/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 2.8734794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:32,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65765 samples/s/p 1:17:10 } +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2977/ 3125], loss: 0.048, per_step_time: 1415ms, lr: 2.8703535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65285 samples/s/p 1:17:12 } +2024-07-30 04:52:37,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2979/ 3125], loss: 0.607, per_step_time: 1414ms, lr: 2.867227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:37,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65621 samples/s/p 1:17:06 } +2024-07-30 04:52:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2981/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 2.864103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65961 samples/s/p 1:17:00 } +2024-07-30 04:52:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2983/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 2.86098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:43,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66160 samples/s/p 1:16:56 } +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2985/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 2.857858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:46,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66190 samples/s/p 1:16:53 } +2024-07-30 04:52:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2987/ 3125], loss: 0.051, per_step_time: 1413ms, lr: 2.8547367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66107 samples/s/p 1:16:51 } +2024-07-30 04:52:52,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2989/ 3125], loss: 0.155, per_step_time: 1444ms, lr: 2.8516167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:52,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.54004 samples/s/p 1:18:28 } +2024-07-30 04:52:54,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2991/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 2.8484965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:54,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66168 samples/s/p 1:16:44 } +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2993/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.8453785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65878 samples/s/p 1:16:44 } +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2995/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 2.8422617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65172 samples/s/p 1:16:47 } +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2997/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.8391455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:03,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65830 samples/s/p 1:16:39 } +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2999/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 2.8360298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:06,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65979 samples/s/p 1:16:35 } +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3001/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 2.832916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65501 samples/s/p 1:16:36 } +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3003/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 2.8298032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:11,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.66036 samples/s/p 1:16:29 } +2024-07-30 04:53:14,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3005/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.8266911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:14,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65872 samples/s/p 1:16:27 } +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3007/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.8235793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65910 samples/s/p 1:16:24 } +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.8204697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.66155 samples/s/p 1:16:19 } +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3011/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.817361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66093 samples/s/p 1:16:17 } +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3013/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.8142535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:26,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66027 samples/s/p 1:16:15 } +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3015/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 2.811147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66229 samples/s/p 1:16:10 } +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3017/ 3125], loss: 0.380, per_step_time: 1419ms, lr: 2.8080415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:31,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.63705 samples/s/p 1:16:28 } +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3019/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 2.8049358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65911 samples/s/p 1:16:07 } +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3021/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 2.8018326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:37,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65861 samples/s/p 1:16:05 } +2024-07-30 04:53:40,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3023/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 2.798729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:40,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.66068 samples/s/p 1:16:00 } +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3025/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.7956276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.66028 samples/s/p 1:15:58 } +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3027/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 2.7925273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65808 samples/s/p 1:15:57 } +2024-07-30 04:53:48,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3029/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 2.7894282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:48,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65810 samples/s/p 1:15:54 } +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3031/ 3125], loss: 0.483, per_step_time: 1414ms, lr: 2.78633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65579 samples/s/p 1:15:53 } +2024-07-30 04:53:54,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3033/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 2.783233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:54,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65770 samples/s/p 1:15:48 } +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3035/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.7801354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65881 samples/s/p 1:15:45 } +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3037/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 2.7770404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65169 samples/s/p 1:15:48 } +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3039/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.7739466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.66100 samples/s/p 1:15:37 } +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3041/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.7708536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:05,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65873 samples/s/p 1:15:36 } +2024-07-30 04:54:08,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3043/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.7677606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:08,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66082 samples/s/p 1:15:32 } +2024-07-30 04:54:11,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3045/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 2.7646702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:11,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66167 samples/s/p 1:15:28 } +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3047/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 2.7615804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:14,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66012 samples/s/p 1:15:27 } +2024-07-30 04:54:17,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3049/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 2.7584906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:17,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66256 samples/s/p 1:15:22 } +2024-07-30 04:54:19,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3051/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 2.755403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:19,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66054 samples/s/p 1:15:21 } +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3053/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.7523165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65967 samples/s/p 1:15:18 } +2024-07-30 04:54:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3055/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.7492315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:25,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65894 samples/s/p 1:15:16 } +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3057/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 2.746147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65673 samples/s/p 1:15:15 } +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3059/ 3125], loss: 0.276, per_step_time: 1412ms, lr: 2.7430635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.66294 samples/s/p 1:15:07 } +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3061/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 2.7399817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:34,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.65723 samples/s/p 1:15:09 } +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3063/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 2.7368992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65822 samples/s/p 1:15:06 } +2024-07-30 04:54:39,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3065/ 3125], loss: 0.355, per_step_time: 1414ms, lr: 2.7338194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:39,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65384 samples/s/p 1:15:06 } +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3067/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.7307394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65856 samples/s/p 1:15:00 } +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3069/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.7276617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:45,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66126 samples/s/p 1:14:55 } +2024-07-30 04:54:48,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3071/ 3125], loss: 0.504, per_step_time: 1413ms, lr: 2.7245849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:48,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66065 samples/s/p 1:14:52 } +2024-07-30 04:54:51,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3073/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.7215092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:51,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65930 samples/s/p 1:14:51 } +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3075/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 2.7184346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:53,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66195 samples/s/p 1:14:46 } +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3077/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 2.715361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:56,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65980 samples/s/p 1:14:44 } +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3079/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 2.7122876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65435 samples/s/p 1:14:46 } +2024-07-30 04:55:02,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3081/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 2.709216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:02,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66093 samples/s/p 1:14:38 } +2024-07-30 04:55:05,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3083/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.7061462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:05,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65616 samples/s/p 1:14:39 } +2024-07-30 04:55:08,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3085/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.7030771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66098 samples/s/p 1:14:32 } +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3087/ 3125], loss: 0.280, per_step_time: 1415ms, lr: 2.7000078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65193 samples/s/p 1:14:37 } +2024-07-30 04:55:13,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3089/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6969408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:13,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65904 samples/s/p 1:14:28 } +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3091/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.6938749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:16,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66070 samples/s/p 1:14:24 } +2024-07-30 04:55:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3093/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.6908092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65721 samples/s/p 1:14:24 } +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3095/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 2.6877456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66236 samples/s/p 1:14:17 } +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3097/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.684683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65983 samples/s/p 1:14:16 } +2024-07-30 04:55:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3099/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.6816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66012 samples/s/p 1:14:13 } +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3101/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 2.678561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:30,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66226 samples/s/p 1:14:09 } +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3103/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.6755022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65813 samples/s/p 1:14:09 } +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3105/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 2.672444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66219 samples/s/p 1:14:03 } +2024-07-30 04:55:39,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3107/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 2.6693863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:39,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65614 samples/s/p 1:14:05 } +2024-07-30 04:55:42,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3109/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 2.6663304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:42,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66328 samples/s/p 1:13:57 } +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3111/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.6632742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66070 samples/s/p 1:13:56 } +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3113/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 2.6602208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65343 samples/s/p 1:13:59 } +2024-07-30 04:55:50,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3115/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 2.6571681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65638 samples/s/p 1:13:53 } +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3117/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 2.6541168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:53,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65816 samples/s/p 1:13:49 } +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3119/ 3125], loss: 0.177, per_step_time: 1412ms, lr: 2.6510663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.66268 samples/s/p 1:13:43 } +2024-07-30 04:55:59,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3121/ 3125], loss: 0.329, per_step_time: 1412ms, lr: 2.648016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:59,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.66198 samples/s/p 1:13:41 } +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3123/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.644968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65863 samples/s/p 1:13:40 } +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3125/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 2.641921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:04,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65965 samples/s/p 1:13:37 } +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.6388755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65853 samples/s/p 1:13:35 } +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 4/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 2.6358305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65712 samples/s/p 1:13:33 } +2024-07-30 04:56:13,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 6/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.632786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:13,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65998 samples/s/p 1:13:28 } +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 8/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 2.6297437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:16,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.66139 samples/s/p 1:13:24 } +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 10/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6267028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:18,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65614 samples/s/p 1:13:25 } +2024-07-30 04:56:21,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 12/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6236612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:21,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65660 samples/s/p 1:13:22 } +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 14/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 2.6206224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65485 samples/s/p 1:13:21 } +2024-07-30 04:56:27,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 16/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 2.6175844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65412 samples/s/p 1:13:18 } +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 18/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 2.6145476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66114 samples/s/p 1:13:10 } +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 20/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.6115122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:33,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65899 samples/s/p 1:13:09 } +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 22/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.6084776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65996 samples/s/p 1:13:05 } +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 24/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 2.6054445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65943 samples/s/p 1:13:03 } +2024-07-30 04:56:41,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 26/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 2.6024115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66061 samples/s/p 1:12:59 } +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 28/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 2.5993802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:44,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.65957 samples/s/p 1:12:57 } +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 30/ 3125], loss: 0.404, per_step_time: 1412ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:47,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66173 samples/s/p 1:12:53 } +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 32/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.5933205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.65989 samples/s/p 1:12:51 } +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 34/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 2.5902932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66249 samples/s/p 1:12:46 } +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 36/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 2.5872669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66145 samples/s/p 1:12:44 } +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 38/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 2.5842417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66043 samples/s/p 1:12:42 } +2024-07-30 04:57:01,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 40/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 2.581216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:01,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66260 samples/s/p 1:12:38 } +2024-07-30 04:57:04,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 42/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 2.5781935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:04,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65986 samples/s/p 1:12:37 } +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 44/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 2.5751715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:07,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66028 samples/s/p 1:12:34 } +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 46/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.5721508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:09,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66126 samples/s/p 1:12:30 } +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 48/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.569131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:12,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.65892 samples/s/p 1:12:29 } +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 50/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.5661127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66070 samples/s/p 1:12:25 } +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 52/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 2.5630948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66108 samples/s/p 1:12:22 } +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 54/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.5600777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66165 samples/s/p 1:12:19 } +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 56/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 2.557063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66093 samples/s/p 1:12:17 } +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 58/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.5540494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66002 samples/s/p 1:12:14 } +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 60/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 2.5510367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:29,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65864 samples/s/p 1:12:13 } +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 62/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.5480251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:32,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66020 samples/s/p 1:12:09 } +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 64/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 2.5450151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66203 samples/s/p 1:12:04 } +2024-07-30 04:57:38,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 66/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.5420063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65972 samples/s/p 1:12:03 } +2024-07-30 04:57:41,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 68/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.5389975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:41,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66158 samples/s/p 1:11:59 } +2024-07-30 04:57:43,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 70/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 2.5359905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66103 samples/s/p 1:11:57 } +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 72/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 2.532985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65646 samples/s/p 1:11:57 } +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 74/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 2.529981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65970 samples/s/p 1:11:52 } +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 76/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 2.5269765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65705 samples/s/p 1:11:51 } +2024-07-30 04:57:55,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 78/ 3125], loss: 0.093, per_step_time: 1414ms, lr: 2.5239747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:55,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65717 samples/s/p 1:11:48 } +2024-07-30 04:57:58,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 80/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.5209742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:58,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.66099 samples/s/p 1:11:43 } +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 82/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 2.5179743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65498 samples/s/p 1:11:44 } +2024-07-30 04:58:03,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 84/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 2.514975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:03,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66225 samples/s/p 1:11:36 } +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 86/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.5119778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66093 samples/s/p 1:11:34 } +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 88/ 3125], loss: 0.132, per_step_time: 1414ms, lr: 2.5089817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65520 samples/s/p 1:11:36 } +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 90/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 2.505987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65487 samples/s/p 1:11:33 } +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 92/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 2.5029933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66101 samples/s/p 1:11:26 } +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 94/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 2.5000008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65840 samples/s/p 1:11:25 } +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 96/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 2.4970086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65510 samples/s/p 1:11:24 } +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 98/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 2.4940175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66169 samples/s/p 1:11:17 } +2024-07-30 04:58:26,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 100/ 3125], loss: 0.347, per_step_time: 1412ms, lr: 2.4910285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:26,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66191 samples/s/p 1:11:14 } +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 102/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.4880408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66102 samples/s/p 1:11:12 } +2024-07-30 04:58:32,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 104/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 2.4850544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:32,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65651 samples/s/p 1:11:12 } +2024-07-30 04:58:35,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 106/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.4820695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:35,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65808 samples/s/p 1:11:08 } +2024-07-30 04:58:37,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 108/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4790852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:37,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65909 samples/s/p 1:11:04 } +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 110/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4761023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66164 samples/s/p 1:11:00 } +2024-07-30 04:58:43,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 112/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 2.4731198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:43,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65733 samples/s/p 1:11:00 } +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 114/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 2.4701392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:46,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66185 samples/s/p 1:10:54 } +2024-07-30 04:58:49,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 116/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 2.46716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:49,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66105 samples/s/p 1:10:52 } +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 118/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.464182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66083 samples/s/p 1:10:49 } +2024-07-30 04:58:54,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 120/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 2.461204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:54,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66055 samples/s/p 1:10:46 } +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 122/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 2.4582287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:57,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.66012 samples/s/p 1:10:44 } +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 124/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.4552542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.66111 samples/s/p 1:10:40 } +2024-07-30 04:59:03,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 126/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.45228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:03,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.66050 samples/s/p 1:10:38 } +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 128/ 3125], loss: 0.396, per_step_time: 1415ms, lr: 2.4493079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:06,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.65241 samples/s/p 1:10:41 } +2024-07-30 04:59:09,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 130/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.4463372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:09,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66156 samples/s/p 1:10:32 } +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 132/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.4433677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66017 samples/s/p 1:10:30 } +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 134/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4403994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66139 samples/s/p 1:10:26 } +2024-07-30 04:59:17,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 136/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 2.4374324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:17,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65985 samples/s/p 1:10:24 } +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 138/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.4344665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65911 samples/s/p 1:10:22 } +2024-07-30 04:59:23,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 140/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 2.431501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:23,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65590 samples/s/p 1:10:22 } +2024-07-30 04:59:26,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 142/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 2.4285375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:26,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66106 samples/s/p 1:10:15 } +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 144/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.4255744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66098 samples/s/p 1:10:12 } +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 146/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.422613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66122 samples/s/p 1:10:09 } +2024-07-30 04:59:34,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 148/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.4196536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:34,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65428 samples/s/p 1:10:12 } +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 150/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.416695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65895 samples/s/p 1:10:05 } +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 152/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.413738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:40,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66109 samples/s/p 1:10:01 } +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 154/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 2.410782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65868 samples/s/p 1:10:00 } +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 156/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 2.407826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66068 samples/s/p 1:09:55 } +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 158/ 3125], loss: 0.271, per_step_time: 1419ms, lr: 2.4048725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.63632 samples/s/p 1:10:11 } +2024-07-30 04:59:51,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 160/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.4019203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:51,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66066 samples/s/p 1:09:50 } +2024-07-30 04:59:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 162/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3989692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66034 samples/s/p 1:09:47 } +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 164/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.396018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66169 samples/s/p 1:09:43 } +2024-07-30 05:00:00,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 166/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.3930697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:00,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65850 samples/s/p 1:09:43 } +2024-07-30 05:00:02,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 168/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.3901223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:02,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65917 samples/s/p 1:09:40 } +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 170/ 3125], loss: 0.350, per_step_time: 1416ms, lr: 2.3871753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.64581 samples/s/p 1:09:47 } +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 172/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.3842304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65959 samples/s/p 1:09:34 } +2024-07-30 05:00:11,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 174/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.3812868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:11,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66094 samples/s/p 1:09:30 } +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 176/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.3783446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65903 samples/s/p 1:09:28 } +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 178/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 2.3754033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65875 samples/s/p 1:09:26 } +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 180/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.3724635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65781 samples/s/p 1:09:24 } +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 182/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 2.369525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65739 samples/s/p 1:09:21 } +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 184/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 2.3665866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65605 samples/s/p 1:09:19 } +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 186/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 2.3636508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65763 samples/s/p 1:09:15 } +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 188/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.360715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:31,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66082 samples/s/p 1:09:10 } +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 190/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 2.357781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66216 samples/s/p 1:09:06 } +2024-07-30 05:00:36,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 192/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.354849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:36,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66055 samples/s/p 1:09:05 } +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 194/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 2.3519178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65927 samples/s/p 1:09:03 } +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 196/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 2.348988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:42,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66059 samples/s/p 1:08:59 } +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 198/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.3460586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66178 samples/s/p 1:08:55 } +2024-07-30 05:00:48,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 200/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.3431312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:48,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66053 samples/s/p 1:08:53 } +2024-07-30 05:00:51,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 202/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 2.3402056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:51,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66003 samples/s/p 1:08:51 } +2024-07-30 05:00:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 204/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 2.3372806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:53,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65960 samples/s/p 1:08:48 } +2024-07-30 05:00:56,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 206/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 2.3343575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:56,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66148 samples/s/p 1:08:44 } +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 208/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.3314344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66092 samples/s/p 1:08:42 } +2024-07-30 05:01:02,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 210/ 3125], loss: 0.288, per_step_time: 1412ms, lr: 2.3285136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:02,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66219 samples/s/p 1:08:38 } +2024-07-30 05:01:05,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 212/ 3125], loss: 0.287, per_step_time: 1418ms, lr: 2.3255939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.63929 samples/s/p 1:08:52 } +2024-07-30 05:01:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 214/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 2.3226744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:08,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66026 samples/s/p 1:08:34 } +2024-07-30 05:01:10,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 216/ 3125], loss: 0.241, per_step_time: 1415ms, lr: 2.3197572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:10,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65332 samples/s/p 1:08:36 } +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 218/ 3125], loss: 0.399, per_step_time: 1416ms, lr: 2.3168413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.64810 samples/s/p 1:08:37 } +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 220/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 2.313927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.66054 samples/s/p 1:08:25 } +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 222/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.311014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65954 samples/s/p 1:08:23 } +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 224/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.3081018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:22,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66138 samples/s/p 1:08:19 } +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 226/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.3051914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66122 samples/s/p 1:08:16 } +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 228/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3022812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.65959 samples/s/p 1:08:14 } +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 230/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.2993727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:30,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66075 samples/s/p 1:08:11 } +2024-07-30 05:01:33,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 232/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.2964653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:33,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66097 samples/s/p 1:08:08 } +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 234/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.2935599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:36,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65408 samples/s/p 1:08:10 } +2024-07-30 05:01:39,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 236/ 3125], loss: 0.349, per_step_time: 1412ms, lr: 2.2906556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66218 samples/s/p 1:08:01 } +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 238/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.287753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65932 samples/s/p 1:08:01 } +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 240/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.284851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66101 samples/s/p 1:07:57 } +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 242/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 2.2819497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65555 samples/s/p 1:07:58 } +2024-07-30 05:01:50,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 244/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 2.279051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65652 samples/s/p 1:07:54 } +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 246/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 2.2761533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66117 samples/s/p 1:07:48 } +2024-07-30 05:01:56,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 248/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 2.2732568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:56,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65565 samples/s/p 1:07:49 } +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 250/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.2703616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66092 samples/s/p 1:07:42 } +2024-07-30 05:02:01,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 252/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 2.2674667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:01,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66072 samples/s/p 1:07:40 } +2024-07-30 05:02:04,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 254/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 2.2645745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:04,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65982 samples/s/p 1:07:38 } +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 256/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.261682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65885 samples/s/p 1:07:35 } +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 258/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.2587922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65997 samples/s/p 1:07:32 } +2024-07-30 05:02:13,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 260/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 2.2559038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:13,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66278 samples/s/p 1:07:27 } +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 262/ 3125], loss: 0.442, per_step_time: 1415ms, lr: 2.2530164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65287 samples/s/p 1:07:31 } +2024-07-30 05:02:18,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 264/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.2501304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:18,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65847 samples/s/p 1:07:24 } +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 266/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.247246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66079 samples/s/p 1:07:20 } +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 268/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 2.2443626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66003 samples/s/p 1:07:18 } +2024-07-30 05:02:27,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 270/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.2414795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:27,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66031 samples/s/p 1:07:15 } +2024-07-30 05:02:30,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 272/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 2.2385987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:30,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.65997 samples/s/p 1:07:12 } +2024-07-30 05:02:33,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 274/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.2357194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:33,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66126 samples/s/p 1:07:08 } +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 276/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.2328406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66069 samples/s/p 1:07:06 } +2024-07-30 05:02:38,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 278/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 2.2299637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:38,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66048 samples/s/p 1:07:03 } +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 280/ 3125], loss: 0.103, per_step_time: 1412ms, lr: 2.2270885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66345 samples/s/p 1:06:58 } +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 282/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 2.2242143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.65986 samples/s/p 1:06:58 } +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 284/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 2.2213417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66003 samples/s/p 1:06:55 } +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 286/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.218469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66070 samples/s/p 1:06:52 } +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 288/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.2155987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:52,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66095 samples/s/p 1:06:49 } +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 290/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 2.21273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:55,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65466 samples/s/p 1:06:50 } +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 292/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 2.2098627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65606 samples/s/p 1:06:47 } +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 294/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 2.2069967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66149 samples/s/p 1:06:40 } +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 296/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 2.2041309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:04,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66240 samples/s/p 1:06:36 } +2024-07-30 05:03:07,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 298/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.2012675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:07,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65947 samples/s/p 1:06:36 } +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 300/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.1984042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:09,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66208 samples/s/p 1:06:31 } +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 302/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.1955436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:12,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66140 samples/s/p 1:06:29 } +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 304/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.192684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.65856 samples/s/p 1:06:28 } +2024-07-30 05:03:18,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 306/ 3125], loss: 0.305, per_step_time: 1416ms, lr: 2.189826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:18,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.64811 samples/s/p 1:06:32 } +2024-07-30 05:03:21,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 308/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.1869691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:21,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66157 samples/s/p 1:06:20 } +2024-07-30 05:03:24,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 310/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 2.1841138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:24,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66101 samples/s/p 1:06:18 } +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 312/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 2.18126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:26,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.65641 samples/s/p 1:06:18 } +2024-07-30 05:03:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 314/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 2.178406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:29,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65773 samples/s/p 1:06:14 } +2024-07-30 05:03:32,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 316/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 2.175555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:32,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65852 samples/s/p 1:06:11 } +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 318/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 2.1727046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66074 samples/s/p 1:06:06 } +2024-07-30 05:03:38,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 320/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 2.1698552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:38,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66201 samples/s/p 1:06:03 } +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 322/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 2.1670078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:41,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65632 samples/s/p 1:06:04 } +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 324/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 2.1641617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:43,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65947 samples/s/p 1:05:59 } +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 326/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.161317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65948 samples/s/p 1:05:56 } +2024-07-30 05:03:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 328/ 3125], loss: 0.163, per_step_time: 1412ms, lr: 2.158473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:49,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66174 samples/s/p 1:05:52 } +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 330/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 2.1556311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66395 samples/s/p 1:05:47 } +2024-07-30 05:03:55,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 332/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.1527903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:55,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66053 samples/s/p 1:05:47 } +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 334/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.1499513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66103 samples/s/p 1:05:44 } +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 336/ 3125], loss: 0.485, per_step_time: 1413ms, lr: 2.1471137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:00,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66042 samples/s/p 1:05:41 } +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 338/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 2.144277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65912 samples/s/p 1:05:39 } +2024-07-30 05:04:06,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 340/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 2.141441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:06,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66076 samples/s/p 1:05:35 } +2024-07-30 05:04:09,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 342/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.1386072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:09,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66152 samples/s/p 1:05:32 } +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 344/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.135774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65919 samples/s/p 1:05:31 } +2024-07-30 05:04:15,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 346/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 2.1329429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:15,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65629 samples/s/p 1:05:30 } +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 348/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 2.1301134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65608 samples/s/p 1:05:27 } +2024-07-30 05:04:20,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 350/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.127285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:20,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65914 samples/s/p 1:05:22 } +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 352/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.1244582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66033 samples/s/p 1:05:19 } +2024-07-30 05:04:26,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 354/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 2.1216326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:26,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66040 samples/s/p 1:05:16 } +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 356/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 2.1188087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66033 samples/s/p 1:05:13 } +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 358/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 2.115985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66158 samples/s/p 1:05:09 } +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 360/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.1131634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65822 samples/s/p 1:05:09 } +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 362/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 2.1103435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65931 samples/s/p 1:05:05 } +2024-07-30 05:04:40,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 364/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 2.1075239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66164 samples/s/p 1:05:01 } +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 366/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 2.1047065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66266 samples/s/p 1:04:57 } +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 368/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.1018907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:46,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66024 samples/s/p 1:04:56 } +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 370/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.0990763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66080 samples/s/p 1:04:53 } +2024-07-30 05:04:51,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 372/ 3125], loss: 0.299, per_step_time: 1412ms, lr: 2.0962623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:51,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66230 samples/s/p 1:04:49 } +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 374/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.0934503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66154 samples/s/p 1:04:47 } +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 376/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 2.09064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65955 samples/s/p 1:04:45 } +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 378/ 3125], loss: 0.187, per_step_time: 1412ms, lr: 2.087831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66230 samples/s/p 1:04:41 } +2024-07-30 05:05:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 380/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 2.0850239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:03,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65820 samples/s/p 1:04:41 } +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 382/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 2.0822176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:06,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66184 samples/s/p 1:04:35 } +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 384/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.079413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.66050 samples/s/p 1:04:33 } +2024-07-30 05:05:11,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 386/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 2.076608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65792 samples/s/p 1:04:32 } +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 388/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.0738055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:14,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65937 samples/s/p 1:04:28 } +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 390/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.0710047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.66076 samples/s/p 1:04:25 } +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 392/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 2.0682057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:20,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65583 samples/s/p 1:04:25 } +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 394/ 3125], loss: 0.306, per_step_time: 1416ms, lr: 2.065408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.64916 samples/s/p 1:04:27 } +2024-07-30 05:05:26,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 396/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 2.0626114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65782 samples/s/p 1:04:18 } +2024-07-30 05:05:28,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 398/ 3125], loss: 0.328, per_step_time: 1414ms, lr: 2.0598168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:28,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65765 samples/s/p 1:04:16 } +2024-07-30 05:05:31,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 400/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.0570221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:31,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.66013 samples/s/p 1:04:11 } +2024-07-30 05:05:34,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 402/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.05423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:34,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66144 samples/s/p 1:04:07 } +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 404/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 2.051439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:37,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66215 samples/s/p 1:04:04 } +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 406/ 3125], loss: 0.152, per_step_time: 1412ms, lr: 2.0486498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66201 samples/s/p 1:04:01 } +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 408/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 2.0458617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66155 samples/s/p 1:03:59 } +2024-07-30 05:05:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 410/ 3125], loss: 0.260, per_step_time: 1412ms, lr: 2.0430743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66289 samples/s/p 1:03:55 } +2024-07-30 05:05:48,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 412/ 3125], loss: 0.390, per_step_time: 1415ms, lr: 2.0402892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:48,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65257 samples/s/p 1:03:59 } +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 414/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 2.0375046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66100 samples/s/p 1:03:51 } +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 416/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 2.0347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66175 samples/s/p 1:03:47 } +2024-07-30 05:05:57,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 418/ 3125], loss: 0.521, per_step_time: 1413ms, lr: 2.0319414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:57,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65808 samples/s/p 1:03:47 } +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 420/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.029162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66110 samples/s/p 1:03:42 } +2024-07-30 05:06:02,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 422/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.0263842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:02,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.66050 samples/s/p 1:03:40 } +2024-07-30 05:06:05,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 424/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.023607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:05,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65829 samples/s/p 1:03:38 } +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 426/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 2.0208322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65908 samples/s/p 1:03:35 } +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 428/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 2.0180582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:11,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65815 samples/s/p 1:03:33 } +2024-07-30 05:06:14,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 430/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 2.0152852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65743 samples/s/p 1:03:30 } +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 432/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 2.0125142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:17,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65374 samples/s/p 1:03:30 } +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 434/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.0097436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:19,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66141 samples/s/p 1:03:22 } +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 436/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.0069756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66213 samples/s/p 1:03:19 } +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 438/ 3125], loss: 0.169, per_step_time: 1412ms, lr: 2.0042091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66199 samples/s/p 1:03:16 } +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 440/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 2.0014438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:28,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65662 samples/s/p 1:03:17 } +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 442/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.9986799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65691 samples/s/p 1:03:14 } +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 444/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 1.9959166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:34,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65679 samples/s/p 1:03:11 } +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 446/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 1.9931558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.66062 samples/s/p 1:03:06 } +2024-07-30 05:06:39,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 448/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.9903964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:39,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.66013 samples/s/p 1:03:03 } +2024-07-30 05:06:42,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 450/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.9876384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:42,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66156 samples/s/p 1:02:59 } +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 452/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 1.9848817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:45,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66192 samples/s/p 1:02:56 } +2024-07-30 05:06:48,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 454/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 1.9821257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:48,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66127 samples/s/p 1:02:54 } +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 456/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.9793717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66125 samples/s/p 1:02:51 } +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 458/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.9766185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:53,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65984 samples/s/p 1:02:49 } +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 460/ 3125], loss: 0.338, per_step_time: 1415ms, lr: 1.9738677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65257 samples/s/p 1:02:51 } +2024-07-30 05:06:59,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 462/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.9711183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:59,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65820 samples/s/p 1:02:45 } +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 464/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1.9683703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65939 samples/s/p 1:02:41 } +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 466/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 1.965624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65687 samples/s/p 1:02:40 } +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 468/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.962879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:08,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65862 samples/s/p 1:02:36 } +2024-07-30 05:07:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 470/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.9601353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:10,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65912 samples/s/p 1:02:33 } +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 472/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 1.9573924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:13,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65809 samples/s/p 1:02:31 } +2024-07-30 05:07:16,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 474/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.9546515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:16,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66090 samples/s/p 1:02:26 } +2024-07-30 05:07:19,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 476/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.9519123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:19,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66151 samples/s/p 1:02:23 } +2024-07-30 05:07:22,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 478/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 1.9491736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:22,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66325 samples/s/p 1:02:19 } +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 480/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 1.9464371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66236 samples/s/p 1:02:16 } +2024-07-30 05:07:27,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 482/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 1.9437023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66055 samples/s/p 1:02:15 } +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 484/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.9409688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.65899 samples/s/p 1:02:13 } +2024-07-30 05:07:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 486/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 1.938237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66169 samples/s/p 1:02:08 } +2024-07-30 05:07:36,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 488/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 1.9355055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:36,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65989 samples/s/p 1:02:07 } +2024-07-30 05:07:39,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 490/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.9327765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66107 samples/s/p 1:02:03 } +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 492/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.930049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:42,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66015 samples/s/p 1:02:01 } +2024-07-30 05:07:44,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 494/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.9273227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66133 samples/s/p 1:01:57 } +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 496/ 3125], loss: 0.438, per_step_time: 1413ms, lr: 1.924598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:47,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65928 samples/s/p 1:01:56 } +2024-07-30 05:07:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 498/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.9218742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:50,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65892 samples/s/p 1:01:53 } +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 500/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 1.9191523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.66063 samples/s/p 1:01:49 } +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 502/ 3125], loss: 0.083, per_step_time: 1415ms, lr: 1.916431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:56,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65277 samples/s/p 1:01:52 } +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 504/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.9137126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:59,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65730 samples/s/p 1:01:46 } +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 506/ 3125], loss: 0.513, per_step_time: 1413ms, lr: 1.9109953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65817 samples/s/p 1:01:42 } +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 508/ 3125], loss: 0.122, per_step_time: 1418ms, lr: 1.9082795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.63929 samples/s/p 1:01:52 } +2024-07-30 05:08:07,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 510/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 1.9055652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:07,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66012 samples/s/p 1:01:36 } +2024-07-30 05:08:10,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 512/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9028523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:10,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65924 samples/s/p 1:01:33 } +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 514/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.9001409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66107 samples/s/p 1:01:29 } +2024-07-30 05:08:16,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 516/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.89743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.66018 samples/s/p 1:01:27 } +2024-07-30 05:08:18,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 518/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 1.8947217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:18,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65799 samples/s/p 1:01:26 } +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 520/ 3125], loss: 0.139, per_step_time: 1415ms, lr: 1.8920147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:21,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65000 samples/s/p 1:01:28 } +2024-07-30 05:08:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 522/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 1.8893084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:24,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65745 samples/s/p 1:01:20 } +2024-07-30 05:08:27,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 524/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 1.8866044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:27,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65976 samples/s/p 1:01:16 } +2024-07-30 05:08:30,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 526/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 1.8839019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:30,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65774 samples/s/p 1:01:14 } +2024-07-30 05:08:33,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 528/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 1.8812009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65941 samples/s/p 1:01:11 } +2024-07-30 05:08:35,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 530/ 3125], loss: 0.005, per_step_time: 1412ms, lr: 1.8785005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:35,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66340 samples/s/p 1:01:05 } +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 532/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 1.8758026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:38,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65817 samples/s/p 1:01:06 } +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 534/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 1.873106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66206 samples/s/p 1:01:00 } +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 536/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 1.870411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65891 samples/s/p 1:01:00 } +2024-07-30 05:08:47,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 538/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 1.8677174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:47,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66077 samples/s/p 1:00:56 } +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 540/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 1.8650254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65485 samples/s/p 1:00:57 } +2024-07-30 05:08:52,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 542/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.862334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:52,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66030 samples/s/p 1:00:50 } +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 544/ 3125], loss: 0.156, per_step_time: 1412ms, lr: 1.859645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:55,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66172 samples/s/p 1:00:46 } +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 546/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 1.8569565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66218 samples/s/p 1:00:43 } +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 548/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 1.8542704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:01,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66129 samples/s/p 1:00:41 } +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 550/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 1.8515858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:04,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66196 samples/s/p 1:00:38 } +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 552/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 1.8489027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:07,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66151 samples/s/p 1:00:35 } +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 554/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 1.8462214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66127 samples/s/p 1:00:33 } +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 556/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 1.8435412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:12,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66103 samples/s/p 1:00:30 } +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 558/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.8408629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66132 samples/s/p 1:00:27 } +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 560/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 1.8381849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:18,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65724 samples/s/p 1:00:27 } +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 562/ 3125], loss: 0.268, per_step_time: 1416ms, lr: 1.8355095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:21,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.64597 samples/s/p 1:00:31 } +2024-07-30 05:09:24,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 564/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 1.8328357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:24,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66129 samples/s/p 1:00:18 } +2024-07-30 05:09:26,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 566/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.8301621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:26,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66140 samples/s/p 1:00:16 } +2024-07-30 05:09:29,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 568/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 1.8274911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:29,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65981 samples/s/p 1:00:14 } +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 570/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.8248218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:32,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66039 samples/s/p 1:00:11 } +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 572/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.8221535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65921 samples/s/p 1:00:08 } +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 574/ 3125], loss: 0.064, per_step_time: 1414ms, lr: 1.8194863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:38,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65688 samples/s/p 1:00:07 } +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 576/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 1.8168216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:41,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65759 samples/s/p 1:00:04 } +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 578/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 1.8141582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65392 samples/s/p 1:00:03 } +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 580/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.8114963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65945 samples/s/p 0:59:57 } +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 582/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.8088361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65971 samples/s/p 0:59:54 } +2024-07-30 05:09:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 584/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.8061771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66089 samples/s/p 0:59:50 } +2024-07-30 05:09:55,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 586/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 1.8035188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:55,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65549 samples/s/p 0:59:51 } +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 588/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.8008631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66020 samples/s/p 0:59:45 } +2024-07-30 05:10:00,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 590/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.798208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:00,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65244 samples/s/p 0:59:47 } +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 592/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 1.7955554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65853 samples/s/p 0:59:41 } +2024-07-30 05:10:06,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 594/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.7929044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65923 samples/s/p 0:59:37 } +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 596/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.7902544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:09,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66170 samples/s/p 0:59:33 } +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 598/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 1.7876064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66131 samples/s/p 0:59:30 } +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 600/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 1.7849596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.66086 samples/s/p 0:59:28 } +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 602/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 1.7823138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65637 samples/s/p 0:59:28 } +2024-07-30 05:10:20,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 604/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 1.7796704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:20,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65988 samples/s/p 0:59:23 } +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 606/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 1.7770287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65878 samples/s/p 0:59:21 } +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 608/ 3125], loss: 0.591, per_step_time: 1413ms, lr: 1.7743882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:26,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65841 samples/s/p 0:59:18 } +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 610/ 3125], loss: 0.108, per_step_time: 1414ms, lr: 1.771748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:29,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65769 samples/s/p 0:59:16 } +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 612/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 1.7691108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65230 samples/s/p 0:59:16 } +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 614/ 3125], loss: 0.111, per_step_time: 1412ms, lr: 1.7664751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.66304 samples/s/p 0:59:07 } +2024-07-30 05:10:37,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 616/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 1.7638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:37,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65612 samples/s/p 0:59:08 } +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 618/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.7612073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.65985 samples/s/p 0:59:03 } +2024-07-30 05:10:43,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 620/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 1.758576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:43,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66240 samples/s/p 0:58:59 } +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 622/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.7559465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:46,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66134 samples/s/p 0:58:56 } +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 624/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 1.7533185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66075 samples/s/p 0:58:54 } +2024-07-30 05:10:51,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 626/ 3125], loss: 0.100, per_step_time: 1412ms, lr: 1.750692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:51,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66203 samples/s/p 0:58:50 } +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 628/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.7480671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65946 samples/s/p 0:58:49 } +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 630/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.7454427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65951 samples/s/p 0:58:46 } +2024-07-30 05:11:00,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 632/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 1.7428207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:00,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65255 samples/s/p 0:58:48 } +2024-07-30 05:11:03,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 634/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 1.7401995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:03,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65220 samples/s/p 0:58:45 } +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 636/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 1.7375809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:06,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66148 samples/s/p 0:58:37 } +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 638/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.7349636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:08,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66005 samples/s/p 0:58:35 } +2024-07-30 05:11:11,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 640/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 1.7323479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:11,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66046 samples/s/p 0:58:32 } +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 642/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.7297339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66140 samples/s/p 0:58:28 } +2024-07-30 05:11:17,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 644/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 1.7271215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:17,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.65976 samples/s/p 0:58:26 } +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 646/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.7245095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66164 samples/s/p 0:58:22 } +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 648/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 1.7219004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:23,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66087 samples/s/p 0:58:20 } +2024-07-30 05:11:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 650/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7192924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:25,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65955 samples/s/p 0:58:18 } +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 652/ 3125], loss: 0.326, per_step_time: 1414ms, lr: 1.7166861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65655 samples/s/p 0:58:17 } +2024-07-30 05:11:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 654/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.7140806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66077 samples/s/p 0:58:12 } +2024-07-30 05:11:34,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 656/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7114774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:34,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66034 samples/s/p 0:58:09 } +2024-07-30 05:11:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 658/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7088759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66152 samples/s/p 0:58:05 } +2024-07-30 05:11:40,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 660/ 3125], loss: 0.120, per_step_time: 1412ms, lr: 1.706275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:40,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66175 samples/s/p 0:58:03 } +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 662/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7036765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:42,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66041 samples/s/p 0:58:01 } +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 664/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7010799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:45,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65939 samples/s/p 0:57:58 } +2024-07-30 05:11:48,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 666/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6984844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:48,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.66049 samples/s/p 0:57:55 } +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 668/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.695891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65873 samples/s/p 0:57:53 } +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 670/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 1.6932988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65791 samples/s/p 0:57:51 } +2024-07-30 05:11:57,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 672/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 1.690708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:57,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65066 samples/s/p 0:57:52 } +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 674/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 1.6881182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65989 samples/s/p 0:57:44 } +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 676/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.6855311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65775 samples/s/p 0:57:42 } +2024-07-30 05:12:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 678/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6829442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:05,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66135 samples/s/p 0:57:37 } +2024-07-30 05:12:08,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 680/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6803601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:08,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66078 samples/s/p 0:57:35 } +2024-07-30 05:12:11,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 682/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.6777774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:11,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65774 samples/s/p 0:57:34 } +2024-07-30 05:12:14,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 684/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 1.6751966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:14,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66115 samples/s/p 0:57:29 } +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 686/ 3125], loss: 0.592, per_step_time: 1413ms, lr: 1.6726168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66106 samples/s/p 0:57:26 } +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 688/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 1.670038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:19,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.66073 samples/s/p 0:57:24 } +2024-07-30 05:12:22,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 690/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.6674619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:22,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65702 samples/s/p 0:57:23 } +2024-07-30 05:12:25,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 692/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.6648873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65955 samples/s/p 0:57:19 } +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 694/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 1.6623145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66130 samples/s/p 0:57:15 } +2024-07-30 05:12:31,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 696/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 1.6597429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66178 samples/s/p 0:57:12 } +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 698/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.657173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66112 samples/s/p 0:57:09 } +2024-07-30 05:12:36,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 700/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6546037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:36,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.65991 samples/s/p 0:57:07 } +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 702/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.6520369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65961 samples/s/p 0:57:04 } +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 704/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.6494708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65904 samples/s/p 0:57:02 } +2024-07-30 05:12:45,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 706/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 1.6469075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65791 samples/s/p 0:57:00 } +2024-07-30 05:12:48,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 708/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.6443457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:48,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.66040 samples/s/p 0:56:56 } +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 1.6417855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65937 samples/s/p 0:56:53 } +2024-07-30 05:12:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 712/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 1.6392266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:53,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65819 samples/s/p 0:56:51 } +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 714/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.6366696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:56,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65997 samples/s/p 0:56:47 } +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 716/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.6341144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:59,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65923 samples/s/p 0:56:45 } +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 718/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 1.6315594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:02,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66157 samples/s/p 0:56:41 } +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 720/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.6290071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:05,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65945 samples/s/p 0:56:39 } +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 722/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 1.6264567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.66032 samples/s/p 0:56:36 } +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 724/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 1.6239064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65787 samples/s/p 0:56:34 } +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 726/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.6213589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65781 samples/s/p 0:56:32 } +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 728/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 1.6188135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65767 samples/s/p 0:56:29 } +2024-07-30 05:13:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 730/ 3125], loss: 0.191, per_step_time: 1412ms, lr: 1.6162691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:19,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66217 samples/s/p 0:56:23 } +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 732/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 1.6137257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66045 samples/s/p 0:56:22 } +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 734/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6111848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65818 samples/s/p 0:56:20 } +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 736/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.6086453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65875 samples/s/p 0:56:17 } +2024-07-30 05:13:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 738/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.6061076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:30,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65682 samples/s/p 0:56:15 } +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 740/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 1.6035715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65886 samples/s/p 0:56:11 } +2024-07-30 05:13:36,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 742/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.6010371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66053 samples/s/p 0:56:07 } +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 744/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 1.5985032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66080 samples/s/p 0:56:04 } +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 746/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 1.5959721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:42,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66076 samples/s/p 0:56:02 } +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 748/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.5934413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66045 samples/s/p 0:55:59 } +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 750/ 3125], loss: 0.348, per_step_time: 1412ms, lr: 1.5909135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.66192 samples/s/p 0:55:55 } +2024-07-30 05:13:47,670 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:14:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 752/ 3125], loss: 0.167, per_step_time: 3212ms, lr: 1.5883871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:24,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 2.49056 samples/s/p 2:07:02 } +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 754/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 1.5858626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65616 samples/s/p 0:55:53 } +2024-07-30 05:14:29,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 756/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.5833392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.66043 samples/s/p 0:55:48 } +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 758/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.5808176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65485 samples/s/p 0:55:48 } +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 760/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 1.5782979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65123 samples/s/p 0:55:47 } +2024-07-30 05:14:38,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 762/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 1.5757787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:38,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65443 samples/s/p 0:55:43 } +2024-07-30 05:14:41,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 764/ 3125], loss: 0.270, per_step_time: 1412ms, lr: 1.5732625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:41,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66177 samples/s/p 0:55:36 } +2024-07-30 05:14:44,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 766/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.5707475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66136 samples/s/p 0:55:33 } +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 768/ 3125], loss: 0.225, per_step_time: 1416ms, lr: 1.5682333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:47,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.64609 samples/s/p 0:55:39 } +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 770/ 3125], loss: 0.351, per_step_time: 1412ms, lr: 1.5657216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66184 samples/s/p 0:55:27 } +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 772/ 3125], loss: 0.538, per_step_time: 1414ms, lr: 1.5632113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:53,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.65712 samples/s/p 0:55:27 } +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 774/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.5607031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.65986 samples/s/p 0:55:23 } +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 776/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.5581957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66172 samples/s/p 0:55:19 } +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 778/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5556905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65958 samples/s/p 0:55:17 } +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 780/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.5531871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65886 samples/s/p 0:55:15 } +2024-07-30 05:15:07,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 782/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.5506852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:07,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66055 samples/s/p 0:55:11 } +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 784/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.548185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:10,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66007 samples/s/p 0:55:08 } +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 786/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 1.5456867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65940 samples/s/p 0:55:06 } +2024-07-30 05:15:16,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 788/ 3125], loss: 0.313, per_step_time: 1414ms, lr: 1.543189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:16,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65571 samples/s/p 0:55:05 } +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 790/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 1.5406936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65443 samples/s/p 0:55:03 } +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 792/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5381992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65838 samples/s/p 0:54:58 } +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 794/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.5357074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65931 samples/s/p 0:54:55 } +2024-07-30 05:15:27,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 796/ 3125], loss: 0.059, per_step_time: 1414ms, lr: 1.5332171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65393 samples/s/p 0:54:55 } +2024-07-30 05:15:30,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 798/ 3125], loss: 0.459, per_step_time: 1415ms, lr: 1.5307284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:30,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65361 samples/s/p 0:54:52 } +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 800/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 1.5282416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:33,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65804 samples/s/p 0:54:47 } +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 802/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 1.525756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.66017 samples/s/p 0:54:43 } +2024-07-30 05:15:39,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 804/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.5232717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:39,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65952 samples/s/p 0:54:40 } +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 806/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 1.5207895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66176 samples/s/p 0:54:36 } +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 808/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 1.5183094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:44,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65466 samples/s/p 0:54:38 } +2024-07-30 05:15:47,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 810/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 1.5158307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:47,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66010 samples/s/p 0:54:32 } +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 812/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.5133529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66089 samples/s/p 0:54:28 } +2024-07-30 05:15:53,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 814/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 1.5108776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65982 samples/s/p 0:54:26 } +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 816/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 1.508404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65858 samples/s/p 0:54:24 } +2024-07-30 05:15:59,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 818/ 3125], loss: 0.181, per_step_time: 1418ms, lr: 1.5059313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:59,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.63902 samples/s/p 0:54:32 } +2024-07-30 05:16:01,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 820/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.5034607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:01,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66061 samples/s/p 0:54:17 } +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 822/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 1.5009921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65121 samples/s/p 0:54:20 } +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 824/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 1.4985251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:07,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.66111 samples/s/p 0:54:11 } +2024-07-30 05:16:10,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 826/ 3125], loss: 0.120, per_step_time: 1415ms, lr: 1.4960599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:10,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65363 samples/s/p 0:54:13 } +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 828/ 3125], loss: 0.141, per_step_time: 1415ms, lr: 1.4935964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65017 samples/s/p 0:54:12 } +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 830/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 1.4911344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65476 samples/s/p 0:54:06 } +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 832/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 1.4886731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65390 samples/s/p 0:54:04 } +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 834/ 3125], loss: 0.438, per_step_time: 1412ms, lr: 1.4862144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66351 samples/s/p 0:53:56 } +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 836/ 3125], loss: 0.238, per_step_time: 1412ms, lr: 1.4837568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66276 samples/s/p 0:53:53 } +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 838/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.4813014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:27,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66121 samples/s/p 0:53:51 } +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 840/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.4788482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65867 samples/s/p 0:53:50 } +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 842/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 1.4763963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65938 samples/s/p 0:53:47 } +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 844/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.473946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65858 samples/s/p 0:53:44 } +2024-07-30 05:16:38,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 846/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.4714974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:38,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66033 samples/s/p 0:53:41 } +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 848/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 1.4690497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66087 samples/s/p 0:53:37 } +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 850/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 1.4666044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66021 samples/s/p 0:53:35 } +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 852/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4641612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66061 samples/s/p 0:53:32 } +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 854/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.4617192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65990 samples/s/p 0:53:29 } +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.4592785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65971 samples/s/p 0:53:27 } +2024-07-30 05:16:55,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 858/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 1.45684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:55,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65652 samples/s/p 0:53:26 } +2024-07-30 05:16:58,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 860/ 3125], loss: 0.421, per_step_time: 1415ms, lr: 1.4544033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:58,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65144 samples/s/p 0:53:26 } +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 862/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 1.4519674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:01,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65804 samples/s/p 0:53:19 } +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 864/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.4495342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.66162 samples/s/p 0:53:14 } +2024-07-30 05:17:07,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 866/ 3125], loss: 0.387, per_step_time: 1415ms, lr: 1.4471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:07,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65252 samples/s/p 0:53:17 } +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 868/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 1.4446726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65821 samples/s/p 0:53:11 } +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 870/ 3125], loss: 0.101, per_step_time: 1416ms, lr: 1.4422443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.64875 samples/s/p 0:53:13 } +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 872/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 1.4398178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:15,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66049 samples/s/p 0:53:04 } +2024-07-30 05:17:18,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 874/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4373928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:18,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66033 samples/s/p 0:53:01 } +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 876/ 3125], loss: 0.184, per_step_time: 1412ms, lr: 1.434969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.66230 samples/s/p 0:52:57 } +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 878/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.4325475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.65980 samples/s/p 0:52:56 } +2024-07-30 05:17:26,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 880/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.430127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:26,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66126 samples/s/p 0:52:52 } +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 882/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4277089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66037 samples/s/p 0:52:50 } +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 884/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 1.4252928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:32,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66042 samples/s/p 0:52:47 } +2024-07-30 05:17:35,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 886/ 3125], loss: 0.484, per_step_time: 1413ms, lr: 1.4228782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:35,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66079 samples/s/p 0:52:44 } +2024-07-30 05:17:38,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 888/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.4204651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65607 samples/s/p 0:52:44 } +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 890/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4180529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66107 samples/s/p 0:52:38 } +2024-07-30 05:17:43,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 892/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 1.4156436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:43,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65554 samples/s/p 0:52:38 } +2024-07-30 05:17:46,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 894/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 1.413236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:46,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65800 samples/s/p 0:52:34 } +2024-07-30 05:17:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 896/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.41083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:49,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66015 samples/s/p 0:52:30 } +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 898/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 1.4084255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66043 samples/s/p 0:52:27 } +2024-07-30 05:17:55,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 900/ 3125], loss: 0.492, per_step_time: 1413ms, lr: 1.406022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:55,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65842 samples/s/p 0:52:25 } +2024-07-30 05:17:58,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 902/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 1.4036211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65633 samples/s/p 0:52:24 } +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 904/ 3125], loss: 0.187, per_step_time: 1418ms, lr: 1.401222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.63840 samples/s/p 0:52:31 } +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 906/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 1.3988235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65378 samples/s/p 0:52:19 } +2024-07-30 05:18:06,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 908/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.396428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:06,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65668 samples/s/p 0:52:15 } +2024-07-30 05:18:09,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 910/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 1.3940337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:09,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65732 samples/s/p 0:52:12 } +2024-07-30 05:18:12,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 912/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 1.3916415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:12,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65687 samples/s/p 0:52:09 } +2024-07-30 05:18:15,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 914/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.389251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:15,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.66020 samples/s/p 0:52:04 } +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 916/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.3868621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:17,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65953 samples/s/p 0:52:02 } +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 918/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.3844749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66139 samples/s/p 0:51:58 } +2024-07-30 05:18:23,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 920/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 1.3820886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:23,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66040 samples/s/p 0:51:56 } +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 922/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 1.379705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66129 samples/s/p 0:51:53 } +2024-07-30 05:18:29,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 924/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.3773221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:29,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66019 samples/s/p 0:51:50 } +2024-07-30 05:18:32,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 926/ 3125], loss: 0.270, per_step_time: 1412ms, lr: 1.374942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:32,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66211 samples/s/p 0:51:46 } +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 928/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.3725635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65962 samples/s/p 0:51:45 } +2024-07-30 05:18:37,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 930/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.3701865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.66035 samples/s/p 0:51:42 } +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 932/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 1.3678115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65941 samples/s/p 0:51:39 } +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 934/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 1.3654375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65842 samples/s/p 0:51:37 } +2024-07-30 05:18:46,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 936/ 3125], loss: 0.172, per_step_time: 1414ms, lr: 1.3630661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:46,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65686 samples/s/p 0:51:35 } +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 938/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.3606963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65674 samples/s/p 0:51:32 } +2024-07-30 05:18:51,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 940/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.3583282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:51,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65851 samples/s/p 0:51:29 } +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 942/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.3559616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.66040 samples/s/p 0:51:25 } +2024-07-30 05:18:57,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 944/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.3535961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:57,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65824 samples/s/p 0:51:23 } +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 946/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 1.3512334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66096 samples/s/p 0:51:19 } +2024-07-30 05:19:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 948/ 3125], loss: 0.154, per_step_time: 1412ms, lr: 1.3488716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:03,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66222 samples/s/p 0:51:15 } +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 950/ 3125], loss: 0.323, per_step_time: 1417ms, lr: 1.3465121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.64193 samples/s/p 0:51:24 } +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 952/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.3441542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:08,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65920 samples/s/p 0:51:11 } +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 954/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 1.3417986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65978 samples/s/p 0:51:08 } +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 956/ 3125], loss: 0.491, per_step_time: 1413ms, lr: 1.3394442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65974 samples/s/p 0:51:05 } +2024-07-30 05:19:17,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 958/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 1.3370919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:17,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65836 samples/s/p 0:51:03 } +2024-07-30 05:19:20,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 960/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 1.3347413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65775 samples/s/p 0:51:01 } +2024-07-30 05:19:23,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 962/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 1.3323923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:23,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65966 samples/s/p 0:50:57 } +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 964/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.3300445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65911 samples/s/p 0:50:54 } +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 966/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.3276988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65983 samples/s/p 0:50:51 } +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 968/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.3253546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:31,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65640 samples/s/p 0:50:50 } +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 970/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 1.3230127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:34,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.66205 samples/s/p 0:50:44 } +2024-07-30 05:19:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 972/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.3206726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65840 samples/s/p 0:50:43 } +2024-07-30 05:19:40,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 974/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 1.3183341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:40,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65845 samples/s/p 0:50:41 } +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 976/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 1.3159975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65436 samples/s/p 0:50:40 } +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 978/ 3125], loss: 0.212, per_step_time: 1415ms, lr: 1.3136619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65313 samples/s/p 0:50:38 } +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 980/ 3125], loss: 0.332, per_step_time: 1417ms, lr: 1.3113287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:48,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.64527 samples/s/p 0:50:39 } +2024-07-30 05:19:51,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 982/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 1.3089972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:51,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65492 samples/s/p 0:50:31 } +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 984/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 1.3066679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:54,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66150 samples/s/p 0:50:25 } +2024-07-30 05:19:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 986/ 3125], loss: 0.351, per_step_time: 1414ms, lr: 1.30434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65751 samples/s/p 0:50:24 } +2024-07-30 05:19:59,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 988/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.302014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65968 samples/s/p 0:50:20 } +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 990/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 1.2996887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:02,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66238 samples/s/p 0:50:16 } +2024-07-30 05:20:05,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 992/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.2973654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:05,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65927 samples/s/p 0:50:15 } +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 994/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 1.2950447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66079 samples/s/p 0:50:11 } +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 996/ 3125], loss: 0.069, per_step_time: 1413ms, lr: 1.2927258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66007 samples/s/p 0:50:09 } +2024-07-30 05:20:14,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 998/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 1.2904086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66026 samples/s/p 0:50:06 } +2024-07-30 05:20:16,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1000/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.288093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:16,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66130 samples/s/p 0:50:02 } +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1002/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.2857795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66099 samples/s/p 0:50:00 } +2024-07-30 05:20:22,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1004/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 1.2834673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:22,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66146 samples/s/p 0:49:57 } +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1006/ 3125], loss: 0.276, per_step_time: 1415ms, lr: 1.2811565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65262 samples/s/p 0:49:58 } +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1008/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.2788483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65778 samples/s/p 0:49:53 } +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1010/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.2765416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:31,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66102 samples/s/p 0:49:48 } +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1012/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.2742358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:33,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65937 samples/s/p 0:49:46 } +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1014/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.271933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65691 samples/s/p 0:49:45 } +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1016/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 1.2696316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65904 samples/s/p 0:49:41 } +2024-07-30 05:20:42,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1018/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.2673321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:42,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65804 samples/s/p 0:49:39 } +2024-07-30 05:20:45,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1020/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 1.2650338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:45,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65722 samples/s/p 0:49:36 } +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1022/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 1.2627381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:48,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65835 samples/s/p 0:49:33 } +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1024/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 1.2604439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:51,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65561 samples/s/p 0:49:31 } +2024-07-30 05:20:53,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1026/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.2581515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:53,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.66130 samples/s/p 0:49:26 } +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1028/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.2558612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65084 samples/s/p 0:49:28 } +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1030/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2535721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66127 samples/s/p 0:49:20 } +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1032/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 1.2512851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65498 samples/s/p 0:49:20 } +2024-07-30 05:21:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1034/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.2489995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:05,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66150 samples/s/p 0:49:14 } +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1036/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.2467151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65833 samples/s/p 0:49:13 } +2024-07-30 05:21:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1038/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.2444335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:10,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66080 samples/s/p 0:49:09 } +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1040/ 3125], loss: 0.436, per_step_time: 1412ms, lr: 1.2421536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:13,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66186 samples/s/p 0:49:06 } +2024-07-30 05:21:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1042/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 1.2398758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:16,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65967 samples/s/p 0:49:04 } +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1044/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 1.2375996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:19,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65753 samples/s/p 0:49:02 } +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1046/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 1.2353253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66200 samples/s/p 0:48:57 } +2024-07-30 05:21:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1048/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2330526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65831 samples/s/p 0:48:56 } +2024-07-30 05:21:27,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1050/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 1.2307808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:27,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66176 samples/s/p 0:48:51 } +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1052/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 1.2285119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65899 samples/s/p 0:48:50 } +2024-07-30 05:21:33,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1054/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 1.2262445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:33,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66198 samples/s/p 0:48:46 } +2024-07-30 05:21:36,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1056/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.2239792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65856 samples/s/p 0:48:45 } +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1058/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 1.2217149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.66013 samples/s/p 0:48:41 } +2024-07-30 05:21:42,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1060/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.2194532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65915 samples/s/p 0:48:39 } +2024-07-30 05:21:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1062/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.2171932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.66148 samples/s/p 0:48:35 } +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1064/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.214934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:47,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.65961 samples/s/p 0:48:33 } +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1066/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.2126776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.66084 samples/s/p 0:48:29 } +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1068/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.2104231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66016 samples/s/p 0:48:27 } +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1070/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.2081704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:56,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65874 samples/s/p 0:48:25 } +2024-07-30 05:21:59,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1072/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 1.2059196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:59,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65734 samples/s/p 0:48:23 } +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1074/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.2036704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65468 samples/s/p 0:48:21 } +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1076/ 3125], loss: 0.046, per_step_time: 1413ms, lr: 1.2014228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:04,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66135 samples/s/p 0:48:15 } +2024-07-30 05:22:07,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1078/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 1.1991766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:07,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65901 samples/s/p 0:48:13 } +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1080/ 3125], loss: 0.406, per_step_time: 1415ms, lr: 1.1969328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65306 samples/s/p 0:48:14 } +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1082/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 1.1946902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65711 samples/s/p 0:48:09 } +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1084/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.1924502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:16,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.66080 samples/s/p 0:48:04 } +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1086/ 3125], loss: 0.321, per_step_time: 1412ms, lr: 1.1902121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:18,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66182 samples/s/p 0:48:01 } +2024-07-30 05:22:21,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1088/ 3125], loss: 0.171, per_step_time: 1415ms, lr: 1.1879754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:21,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65268 samples/s/p 0:48:02 } +2024-07-30 05:22:24,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1090/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.1857411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65872 samples/s/p 0:47:56 } +2024-07-30 05:22:27,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1092/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 1.1835074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:27,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65524 samples/s/p 0:47:55 } +2024-07-30 05:22:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1094/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 1.1812764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66216 samples/s/p 0:47:49 } +2024-07-30 05:22:33,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 1.1790472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66106 samples/s/p 0:47:47 } +2024-07-30 05:22:35,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1098/ 3125], loss: 0.470, per_step_time: 1414ms, lr: 1.1768198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:35,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65711 samples/s/p 0:47:46 } +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1100/ 3125], loss: 0.447, per_step_time: 1414ms, lr: 1.1745944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65743 samples/s/p 0:47:43 } +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1102/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 1.1723699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66124 samples/s/p 0:47:38 } +2024-07-30 05:22:44,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1104/ 3125], loss: 0.231, per_step_time: 1412ms, lr: 1.1701483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:44,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66230 samples/s/p 0:47:35 } +2024-07-30 05:22:47,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1106/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 1.167928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:47,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.66012 samples/s/p 0:47:33 } +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1108/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.1657089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65870 samples/s/p 0:47:31 } +2024-07-30 05:22:52,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1110/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 1.1634928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:52,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65564 samples/s/p 0:47:30 } +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1112/ 3125], loss: 0.417, per_step_time: 1414ms, lr: 1.1612782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65720 samples/s/p 0:47:26 } +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1114/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 1.1590654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65376 samples/s/p 0:47:25 } +2024-07-30 05:23:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1116/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.1568549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65799 samples/s/p 0:47:20 } +2024-07-30 05:23:04,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1118/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.1546457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:04,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65965 samples/s/p 0:47:16 } +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1120/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 1.1524385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65764 samples/s/p 0:47:15 } +2024-07-30 05:23:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1122/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 1.1502325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.66067 samples/s/p 0:47:10 } +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1124/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1480287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66053 samples/s/p 0:47:08 } +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1126/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.1458262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66080 samples/s/p 0:47:05 } +2024-07-30 05:23:18,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1128/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.1436265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:18,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66027 samples/s/p 0:47:02 } +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1130/ 3125], loss: 0.113, per_step_time: 1412ms, lr: 1.1414284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:21,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66247 samples/s/p 0:46:58 } +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1132/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 1.1392325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:24,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.65936 samples/s/p 0:46:57 } +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1134/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.1370381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66011 samples/s/p 0:46:54 } +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1136/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 1.1348446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66144 samples/s/p 0:46:50 } +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1138/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.1326542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65844 samples/s/p 0:46:49 } +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1140/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.1304655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:35,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66071 samples/s/p 0:46:45 } +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1142/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.1282783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66234 samples/s/p 0:46:41 } +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1144/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.1260936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:41,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.66059 samples/s/p 0:46:39 } +2024-07-30 05:23:43,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1239093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:43,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.66056 samples/s/p 0:46:36 } +2024-07-30 05:23:46,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1148/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.1217281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:46,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65518 samples/s/p 0:46:36 } +2024-07-30 05:23:49,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1150/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 1.1195477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.66047 samples/s/p 0:46:31 } +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1152/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.1173704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66080 samples/s/p 0:46:28 } +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1154/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 1.1151942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66056 samples/s/p 0:46:25 } +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1156/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 1.1130204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:58,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66090 samples/s/p 0:46:22 } +2024-07-30 05:24:00,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1158/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 1.1108484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:00,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.65228 samples/s/p 0:46:24 } +2024-07-30 05:24:03,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1160/ 3125], loss: 0.223, per_step_time: 1415ms, lr: 1.1086782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:03,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.65353 samples/s/p 0:46:20 } +2024-07-30 05:24:06,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1162/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 1.1065096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:06,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65624 samples/s/p 0:46:16 } +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1164/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.1043423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65926 samples/s/p 0:46:12 } +2024-07-30 05:24:12,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1166/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.1021775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:12,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65952 samples/s/p 0:46:09 } +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1168/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.1000147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65879 samples/s/p 0:46:06 } +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1170/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.0978531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66101 samples/s/p 0:46:02 } +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1172/ 3125], loss: 0.636, per_step_time: 1413ms, lr: 1.0956943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65810 samples/s/p 0:46:01 } +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1174/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.0935369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65902 samples/s/p 0:45:58 } +2024-07-30 05:24:26,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1176/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 1.0913816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.66032 samples/s/p 0:45:54 } +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1178/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 1.0892278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65866 samples/s/p 0:45:52 } +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1180/ 3125], loss: 0.293, per_step_time: 1417ms, lr: 1.0870757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.64540 samples/s/p 0:45:56 } +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1182/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 1.0849258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.66011 samples/s/p 0:45:46 } +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1184/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.082778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.66040 samples/s/p 0:45:43 } +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1186/ 3125], loss: 0.209, per_step_time: 1415ms, lr: 1.0806319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:40,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65289 samples/s/p 0:45:44 } +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1188/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.0784879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65975 samples/s/p 0:45:37 } +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1190/ 3125], loss: 0.440, per_step_time: 1412ms, lr: 1.0763446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66201 samples/s/p 0:45:34 } +2024-07-30 05:24:49,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1192/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 1.0742044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:49,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65942 samples/s/p 0:45:32 } +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1194/ 3125], loss: 0.216, per_step_time: 1412ms, lr: 1.0720652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66201 samples/s/p 0:45:28 } +2024-07-30 05:24:54,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1196/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.0699284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:54,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66061 samples/s/p 0:45:26 } +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1198/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 1.0677936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65673 samples/s/p 0:45:25 } +2024-07-30 05:25:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1200/ 3125], loss: 0.418, per_step_time: 1414ms, lr: 1.0656607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65701 samples/s/p 0:45:22 } +2024-07-30 05:25:03,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1202/ 3125], loss: 0.381, per_step_time: 1415ms, lr: 1.0635296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:03,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65249 samples/s/p 0:45:21 } +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1204/ 3125], loss: 0.090, per_step_time: 1416ms, lr: 1.0614004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64734 samples/s/p 0:45:21 } +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1206/ 3125], loss: 0.344, per_step_time: 1416ms, lr: 1.0592731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:08,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64671 samples/s/p 0:45:18 } +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1208/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.0571473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66016 samples/s/p 0:45:09 } +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1210/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 1.055024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66302 samples/s/p 0:45:05 } +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1212/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.0529023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65941 samples/s/p 0:45:04 } +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1214/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.0507816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66154 samples/s/p 0:45:00 } +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1216/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.0486639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65975 samples/s/p 0:44:58 } +2024-07-30 05:25:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1218/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 1.0465478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:25,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66001 samples/s/p 0:44:55 } +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1220/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 1.0444339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66046 samples/s/p 0:44:52 } +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1222/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.0423207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.65921 samples/s/p 0:44:50 } +2024-07-30 05:25:34,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1224/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 1.0402107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66097 samples/s/p 0:44:46 } +2024-07-30 05:25:37,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1226/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.0381021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:37,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66182 samples/s/p 0:44:43 } +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1228/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.0359954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66008 samples/s/p 0:44:41 } +2024-07-30 05:25:42,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1230/ 3125], loss: 0.169, per_step_time: 1412ms, lr: 1.0338911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66283 samples/s/p 0:44:37 } +2024-07-30 05:25:45,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1232/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 1.0317883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:45,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65868 samples/s/p 0:44:36 } +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1234/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.0296869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66118 samples/s/p 0:44:32 } +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1236/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 1.0275876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66020 samples/s/p 0:44:29 } +2024-07-30 05:25:54,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1238/ 3125], loss: 0.423, per_step_time: 1416ms, lr: 1.0254902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:54,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.64838 samples/s/p 0:44:32 } +2024-07-30 05:25:57,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1240/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 1.023395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:57,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66211 samples/s/p 0:44:23 } +2024-07-30 05:25:59,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1242/ 3125], loss: 0.130, per_step_time: 1412ms, lr: 1.0213017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:59,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66192 samples/s/p 0:44:20 } +2024-07-30 05:26:02,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1244/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 1.0192105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.65943 samples/s/p 0:44:18 } +2024-07-30 05:26:05,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1246/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 1.0171208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:05,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65568 samples/s/p 0:44:17 } +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1248/ 3125], loss: 0.165, per_step_time: 1415ms, lr: 1.0150334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65262 samples/s/p 0:44:16 } +2024-07-30 05:26:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1250/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.0129478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.66044 samples/s/p 0:44:09 } +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1252/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.0108635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65648 samples/s/p 0:44:08 } +2024-07-30 05:26:16,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1254/ 3125], loss: 0.194, per_step_time: 1415ms, lr: 1.0087817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65061 samples/s/p 0:44:08 } +2024-07-30 05:26:19,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1256/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 1.0067016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:19,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65752 samples/s/p 0:44:02 } +2024-07-30 05:26:22,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1258/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 1.0046228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:22,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65751 samples/s/p 0:44:00 } +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1260/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.0025468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65860 samples/s/p 0:43:56 } +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1262/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.0004726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.66036 samples/s/p 0:43:53 } +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1264/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 9.984001e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65378 samples/s/p 0:43:53 } +2024-07-30 05:26:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1266/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.963288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66016 samples/s/p 0:43:47 } +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1268/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.942609e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:36,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66221 samples/s/p 0:43:43 } +2024-07-30 05:26:39,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1270/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 9.921941e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:39,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66137 samples/s/p 0:43:41 } +2024-07-30 05:26:42,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1272/ 3125], loss: 0.419, per_step_time: 1419ms, lr: 9.901294e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:42,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.63524 samples/s/p 0:43:50 } +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1274/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 9.880667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66111 samples/s/p 0:43:35 } +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1276/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 9.86006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.65963 samples/s/p 0:43:33 } +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1278/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.839463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:51,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66118 samples/s/p 0:43:30 } +2024-07-30 05:26:53,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1280/ 3125], loss: 0.264, per_step_time: 1412ms, lr: 9.818893e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66195 samples/s/p 0:43:26 } +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1282/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.798335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.65878 samples/s/p 0:43:25 } +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1284/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.777805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65993 samples/s/p 0:43:22 } +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1286/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.757292e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:02,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66137 samples/s/p 0:43:18 } +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1288/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 9.7368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66144 samples/s/p 0:43:15 } +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1290/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.716326e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66079 samples/s/p 0:43:13 } +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1292/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.695873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65967 samples/s/p 0:43:10 } +2024-07-30 05:27:13,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1294/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.675427e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:13,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66085 samples/s/p 0:43:07 } +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1296/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.655014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66082 samples/s/p 0:43:04 } +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1298/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.634616e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:19,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66043 samples/s/p 0:43:02 } +2024-07-30 05:27:22,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1300/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 9.614238e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:22,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66321 samples/s/p 0:42:58 } +2024-07-30 05:27:25,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1302/ 3125], loss: 0.200, per_step_time: 1415ms, lr: 9.593874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:25,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65309 samples/s/p 0:42:59 } +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1304/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.573533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:27,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.66137 samples/s/p 0:42:53 } +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1306/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.553214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:30,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65852 samples/s/p 0:42:51 } +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1308/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.532913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65447 samples/s/p 0:42:50 } +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1310/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 9.512627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65802 samples/s/p 0:42:46 } +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1312/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.4923644e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:39,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66060 samples/s/p 0:42:42 } +2024-07-30 05:27:42,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1314/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.4721196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:42,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66099 samples/s/p 0:42:39 } +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1316/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 9.4518987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:44,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.65940 samples/s/p 0:42:37 } +2024-07-30 05:27:47,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1318/ 3125], loss: 0.449, per_step_time: 1412ms, lr: 9.4316925e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:47,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66180 samples/s/p 0:42:33 } +2024-07-30 05:27:50,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1320/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.4115137e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:50,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66124 samples/s/p 0:42:30 } +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1322/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.391346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65923 samples/s/p 0:42:28 } +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1324/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.371191e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66099 samples/s/p 0:42:25 } +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1326/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.3510596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65890 samples/s/p 0:42:23 } +2024-07-30 05:28:01,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1328/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 9.330952e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66030 samples/s/p 0:42:19 } +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1330/ 3125], loss: 0.522, per_step_time: 1414ms, lr: 9.310865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65423 samples/s/p 0:42:19 } +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1332/ 3125], loss: 0.282, per_step_time: 1415ms, lr: 9.2907993e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:07,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65277 samples/s/p 0:42:17 } +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1334/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.270751e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.66071 samples/s/p 0:42:11 } +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1336/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.2507213e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65722 samples/s/p 0:42:09 } +2024-07-30 05:28:16,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1338/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 9.230703e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:16,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65793 samples/s/p 0:42:06 } +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1340/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.2107143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:18,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65800 samples/s/p 0:42:03 } +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1342/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 9.190744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:21,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65833 samples/s/p 0:42:00 } +2024-07-30 05:28:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1344/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.1707915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:24,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66126 samples/s/p 0:41:56 } +2024-07-30 05:28:27,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1346/ 3125], loss: 0.495, per_step_time: 1413ms, lr: 9.1508593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:27,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66128 samples/s/p 0:41:53 } +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1348/ 3125], loss: 0.077, per_step_time: 1413ms, lr: 9.1309425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:30,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66020 samples/s/p 0:41:51 } +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1350/ 3125], loss: 0.083, per_step_time: 1412ms, lr: 9.1110496e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66297 samples/s/p 0:41:47 } +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1352/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.0911686e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65880 samples/s/p 0:41:46 } +2024-07-30 05:28:38,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1354/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.071317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:38,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66047 samples/s/p 0:41:42 } +2024-07-30 05:28:41,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1356/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.0514806e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:41,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66069 samples/s/p 0:41:40 } +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1358/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.0316684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66077 samples/s/p 0:41:37 } +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1360/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.011873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:47,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66067 samples/s/p 0:41:34 } +2024-07-30 05:28:50,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1362/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.992097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:50,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65977 samples/s/p 0:41:31 } +2024-07-30 05:28:52,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1364/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 8.972341e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:52,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65919 samples/s/p 0:41:29 } +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1366/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.9526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65693 samples/s/p 0:41:27 } +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1368/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 8.9328825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65713 samples/s/p 0:41:24 } +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1370/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 8.913186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66204 samples/s/p 0:41:19 } +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1372/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 8.8935013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65913 samples/s/p 0:41:18 } +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1374/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 8.873841e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66145 samples/s/p 0:41:14 } +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1376/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 8.854207e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66330 samples/s/p 0:41:10 } +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1378/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.834588e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66197 samples/s/p 0:41:08 } +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1380/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 8.8149875e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66124 samples/s/p 0:41:05 } +2024-07-30 05:29:18,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1382/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 8.795401e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:18,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66080 samples/s/p 0:41:03 } +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1384/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.7758417e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:21,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66053 samples/s/p 0:41:00 } +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1386/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 8.7563006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66048 samples/s/p 0:40:57 } +2024-07-30 05:29:26,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1388/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 8.736783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:26,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66236 samples/s/p 0:40:54 } +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1390/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 8.7172805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:29,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66062 samples/s/p 0:40:52 } +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1392/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 8.697793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66055 samples/s/p 0:40:49 } +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1394/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.678335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:35,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66065 samples/s/p 0:40:46 } +2024-07-30 05:29:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1396/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.658886e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65835 samples/s/p 0:40:44 } +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1398/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 8.6394635e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65452 samples/s/p 0:40:43 } +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1400/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 8.620065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:43,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65877 samples/s/p 0:40:38 } +2024-07-30 05:29:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1402/ 3125], loss: 0.256, per_step_time: 1414ms, lr: 8.6006816e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:46,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65378 samples/s/p 0:40:38 } +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1404/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.581319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.66146 samples/s/p 0:40:31 } +2024-07-30 05:29:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1406/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.5619746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:52,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65931 samples/s/p 0:40:29 } +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1408/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.5426535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66051 samples/s/p 0:40:26 } +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1410/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.523345e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:58,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65910 samples/s/p 0:40:24 } +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1412/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 8.5040597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65978 samples/s/p 0:40:21 } +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1414/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 8.4847983e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65613 samples/s/p 0:40:20 } +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1416/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 8.4655494e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65823 samples/s/p 0:40:16 } +2024-07-30 05:30:09,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1418/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.446324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:09,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66021 samples/s/p 0:40:12 } +2024-07-30 05:30:12,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1420/ 3125], loss: 0.274, per_step_time: 1425ms, lr: 8.427119e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:12,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.61139 samples/s/p 0:40:30 } +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1422/ 3125], loss: 0.061, per_step_time: 1413ms, lr: 8.407938e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66137 samples/s/p 0:40:06 } +2024-07-30 05:30:17,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1424/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.3887664e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:17,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66041 samples/s/p 0:40:04 } +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1426/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 8.3696216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65447 samples/s/p 0:40:03 } +2024-07-30 05:30:23,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1428/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 8.3505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:23,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66033 samples/s/p 0:39:58 } +2024-07-30 05:30:26,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1430/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 8.331391e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:26,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65800 samples/s/p 0:39:56 } +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1432/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 8.3123115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:29,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65971 samples/s/p 0:39:53 } +2024-07-30 05:30:32,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1434/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 8.293244e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:32,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.66155 samples/s/p 0:39:49 } +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1436/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.2741946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.65860 samples/s/p 0:39:47 } +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1438/ 3125], loss: 0.568, per_step_time: 1413ms, lr: 8.2551685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.65940 samples/s/p 0:39:44 } +2024-07-30 05:30:40,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1440/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.236155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:40,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66127 samples/s/p 0:39:41 } +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1442/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 8.217174e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66115 samples/s/p 0:39:38 } +2024-07-30 05:30:46,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1444/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.1982074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:46,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66067 samples/s/p 0:39:35 } +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1446/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.179262e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:49,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66041 samples/s/p 0:39:32 } +2024-07-30 05:30:51,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1448/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.160338e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66107 samples/s/p 0:39:29 } +2024-07-30 05:30:54,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1450/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 8.141431e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:54,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66256 samples/s/p 0:39:26 } +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1452/ 3125], loss: 0.133, per_step_time: 1415ms, lr: 8.1225454e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:57,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65121 samples/s/p 0:39:28 } +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1454/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.1036774e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66063 samples/s/p 0:39:21 } +2024-07-30 05:31:03,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1456/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 8.0848275e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66226 samples/s/p 0:39:18 } +2024-07-30 05:31:06,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1458/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 8.0660044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66255 samples/s/p 0:39:15 } +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1460/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.047193e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65884 samples/s/p 0:39:13 } +2024-07-30 05:31:11,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1462/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.028409e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:11,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65916 samples/s/p 0:39:10 } +2024-07-30 05:31:14,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1464/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.0096453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:14,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66052 samples/s/p 0:39:07 } +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1466/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.9908966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65851 samples/s/p 0:39:05 } +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1468/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 7.9721656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:20,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66086 samples/s/p 0:39:01 } +2024-07-30 05:31:23,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1470/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 7.9534647e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:23,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65992 samples/s/p 0:38:59 } +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1472/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.9347785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.66057 samples/s/p 0:38:56 } +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1474/ 3125], loss: 0.316, per_step_time: 1415ms, lr: 7.916108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65367 samples/s/p 0:38:56 } +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1476/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 7.8974665e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65765 samples/s/p 0:38:51 } +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1478/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 7.87884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65771 samples/s/p 0:38:48 } +2024-07-30 05:31:37,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1480/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 7.860231e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:37,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65768 samples/s/p 0:38:46 } +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1482/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.841646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65839 samples/s/p 0:38:42 } +2024-07-30 05:31:42,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1484/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 7.8230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:42,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65641 samples/s/p 0:38:40 } +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1486/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.804531e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65882 samples/s/p 0:38:37 } +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1488/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 7.7860085e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65310 samples/s/p 0:38:36 } +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1490/ 3125], loss: 0.481, per_step_time: 1412ms, lr: 7.767504e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66353 samples/s/p 0:38:29 } +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1492/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.7490176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66101 samples/s/p 0:38:27 } +2024-07-30 05:31:57,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1494/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 7.7305555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:57,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.65787 samples/s/p 0:38:26 } +2024-07-30 05:31:59,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1496/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 7.7121075e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66068 samples/s/p 0:38:22 } +2024-07-30 05:32:02,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1498/ 3125], loss: 0.152, per_step_time: 1412ms, lr: 7.693684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66215 samples/s/p 0:38:18 } +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1500/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 7.675281e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65015 samples/s/p 0:38:20 } +2024-07-30 05:32:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1502/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.656899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66033 samples/s/p 0:38:13 } +2024-07-30 05:32:11,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1504/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 7.6385317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:11,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66117 samples/s/p 0:38:10 } +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1506/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 7.6201883e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65713 samples/s/p 0:38:09 } +2024-07-30 05:32:16,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1508/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.601866e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:16,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66081 samples/s/p 0:38:05 } +2024-07-30 05:32:19,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1510/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.583564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:19,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65889 samples/s/p 0:38:03 } +2024-07-30 05:32:22,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1512/ 3125], loss: 0.093, per_step_time: 1413ms, lr: 7.5652775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:22,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66092 samples/s/p 0:37:59 } +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1514/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.547015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66043 samples/s/p 0:37:56 } +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1516/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 7.5287755e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:28,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65908 samples/s/p 0:37:54 } +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1518/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.5105544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66075 samples/s/p 0:37:51 } +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1520/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.492354e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:33,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66242 samples/s/p 0:37:47 } +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1522/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 7.474175e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:36,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65777 samples/s/p 0:37:46 } +2024-07-30 05:32:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1524/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 7.4560074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66005 samples/s/p 0:37:42 } +2024-07-30 05:32:42,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1526/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 7.43787e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:42,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66137 samples/s/p 0:37:39 } +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1528/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 7.419744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65638 samples/s/p 0:37:38 } +2024-07-30 05:32:48,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1530/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.401645e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:48,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65994 samples/s/p 0:37:34 } +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1532/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 7.383564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65924 samples/s/p 0:37:31 } +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1534/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.3655065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.66141 samples/s/p 0:37:28 } +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1536/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 7.3474706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66332 samples/s/p 0:37:24 } +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1538/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.3294547e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66148 samples/s/p 0:37:22 } +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1540/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 7.311451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65872 samples/s/p 0:37:20 } +2024-07-30 05:33:05,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1542/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 7.2934745e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:05,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66036 samples/s/p 0:37:17 } +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1544/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 7.2755154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65973 samples/s/p 0:37:14 } +2024-07-30 05:33:10,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1546/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.2575807e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:10,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65982 samples/s/p 0:37:11 } +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1548/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.23966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:13,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65938 samples/s/p 0:37:09 } +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1550/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 7.221764e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65794 samples/s/p 0:37:06 } +2024-07-30 05:33:19,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1552/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.2038887e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:19,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65871 samples/s/p 0:37:03 } +2024-07-30 05:33:22,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1554/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 7.186028e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:22,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65768 samples/s/p 0:37:01 } +2024-07-30 05:33:24,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1556/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.168197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:24,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.66238 samples/s/p 0:36:56 } +2024-07-30 05:33:27,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1558/ 3125], loss: 0.151, per_step_time: 1424ms, lr: 7.1503814e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:27,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.61490 samples/s/p 0:37:12 } +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1560/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.1325894e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65693 samples/s/p 0:36:53 } +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1562/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.1148185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65775 samples/s/p 0:36:50 } +2024-07-30 05:33:36,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1564/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.097065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:36,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65424 samples/s/p 0:36:48 } +2024-07-30 05:33:39,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1566/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 7.079333e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:39,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65833 samples/s/p 0:36:44 } +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1568/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.061618e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66008 samples/s/p 0:36:40 } +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1570/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.043928e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:44,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66075 samples/s/p 0:36:37 } +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1572/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.026252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:47,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65967 samples/s/p 0:36:35 } +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1574/ 3125], loss: 0.055, per_step_time: 1412ms, lr: 7.008603e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66233 samples/s/p 0:36:31 } +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1576/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 6.990972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66113 samples/s/p 0:36:28 } +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1578/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.973365e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65949 samples/s/p 0:36:26 } +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1580/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.9557757e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66104 samples/s/p 0:36:23 } +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1582/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.93821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65975 samples/s/p 0:36:21 } +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1584/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 6.920656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66141 samples/s/p 0:36:17 } +2024-07-30 05:34:07,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1586/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9031324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:07,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66065 samples/s/p 0:36:15 } +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1588/ 3125], loss: 0.271, per_step_time: 1416ms, lr: 6.8856235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.64935 samples/s/p 0:36:16 } +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1590/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 6.868142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:13,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66160 samples/s/p 0:36:08 } +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1592/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 6.8506716e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66060 samples/s/p 0:36:06 } +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1594/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 6.833228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65549 samples/s/p 0:36:05 } +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1596/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 6.8158056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:21,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66044 samples/s/p 0:36:00 } +2024-07-30 05:34:24,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1598/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.7983956e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:24,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66047 samples/s/p 0:35:58 } +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1600/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.7810146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66024 samples/s/p 0:35:55 } +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1602/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 6.763652e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65777 samples/s/p 0:35:53 } +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1604/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 6.74631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65729 samples/s/p 0:35:50 } +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1606/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.7289915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:35,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65863 samples/s/p 0:35:47 } +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1608/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 6.711691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65602 samples/s/p 0:35:45 } +2024-07-30 05:34:41,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1610/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 6.694412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:41,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.66230 samples/s/p 0:35:40 } +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1612/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 6.67715e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65164 samples/s/p 0:35:41 } +2024-07-30 05:34:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1614/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.659913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:47,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65991 samples/s/p 0:35:35 } +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1616/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.64269e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:50,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66081 samples/s/p 0:35:32 } +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1618/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.6254944e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66084 samples/s/p 0:35:29 } +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1620/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 6.608319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66162 samples/s/p 0:35:26 } +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1622/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 6.591165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.66064 samples/s/p 0:35:24 } +2024-07-30 05:35:01,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1624/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.574032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:01,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.65868 samples/s/p 0:35:22 } +2024-07-30 05:35:04,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1626/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.55691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:04,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.65736 samples/s/p 0:35:19 } +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1628/ 3125], loss: 0.344, per_step_time: 1419ms, lr: 6.5398183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.63502 samples/s/p 0:35:25 } +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1630/ 3125], loss: 0.373, per_step_time: 1417ms, lr: 6.5227505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.64368 samples/s/p 0:35:19 } +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1632/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 6.505698e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:12,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65899 samples/s/p 0:35:10 } +2024-07-30 05:35:15,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1634/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 6.488666e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:15,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65680 samples/s/p 0:35:08 } +2024-07-30 05:35:18,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1636/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.471661e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:18,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66141 samples/s/p 0:35:04 } +2024-07-30 05:35:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1638/ 3125], loss: 0.127, per_step_time: 1412ms, lr: 6.4546646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:21,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66187 samples/s/p 0:35:01 } +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1640/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.4376917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65891 samples/s/p 0:34:59 } +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1642/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 6.420746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66129 samples/s/p 0:34:55 } +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1644/ 3125], loss: 0.177, per_step_time: 1415ms, lr: 6.4038187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65301 samples/s/p 0:34:55 } +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1646/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.386912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66149 samples/s/p 0:34:49 } +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1648/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.3700315e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:35,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65926 samples/s/p 0:34:47 } +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1650/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.3531667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66057 samples/s/p 0:34:44 } +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1652/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 6.336322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66233 samples/s/p 0:34:41 } +2024-07-30 05:35:43,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1654/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 6.319502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:43,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66219 samples/s/p 0:34:38 } +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1656/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 6.3026965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:46,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66277 samples/s/p 0:34:35 } +2024-07-30 05:35:49,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1658/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 6.285912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:49,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65994 samples/s/p 0:34:33 } +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1660/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 6.269154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66230 samples/s/p 0:34:29 } +2024-07-30 05:35:55,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1662/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 6.2524106e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:55,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65426 samples/s/p 0:34:29 } +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1664/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.2356946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66020 samples/s/p 0:34:24 } +2024-07-30 05:36:00,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1666/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 6.2189963e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:00,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66219 samples/s/p 0:34:21 } +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1668/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.202322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:03,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65817 samples/s/p 0:34:20 } +2024-07-30 05:36:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1670/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 6.1856593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65763 samples/s/p 0:34:17 } +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1672/ 3125], loss: 0.371, per_step_time: 1414ms, lr: 6.169027e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65633 samples/s/p 0:34:15 } +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1674/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 6.152415e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65818 samples/s/p 0:34:11 } +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1676/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 6.135824e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65679 samples/s/p 0:34:09 } +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1678/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 6.119251e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66153 samples/s/p 0:34:04 } +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1680/ 3125], loss: 0.404, per_step_time: 1412ms, lr: 6.1026986e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66192 samples/s/p 0:34:01 } +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1682/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.0861674e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:23,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.65873 samples/s/p 0:34:00 } +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1684/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.069654e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.65982 samples/s/p 0:33:56 } +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1686/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.053165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:29,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66088 samples/s/p 0:33:53 } +2024-07-30 05:36:32,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1688/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.036699e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:32,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66167 samples/s/p 0:33:50 } +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1690/ 3125], loss: 0.472, per_step_time: 1412ms, lr: 6.0202535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66312 samples/s/p 0:33:47 } +2024-07-30 05:36:37,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1692/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 6.003827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.65982 samples/s/p 0:33:45 } +2024-07-30 05:36:40,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1694/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9874264e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66140 samples/s/p 0:33:42 } +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1696/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 5.971044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:43,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66190 samples/s/p 0:33:39 } +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1698/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 5.9546767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:46,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65974 samples/s/p 0:33:37 } +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1700/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 5.938336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:49,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65992 samples/s/p 0:33:34 } +2024-07-30 05:36:51,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1702/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 5.922016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:51,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65873 samples/s/p 0:33:31 } +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1704/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 5.9057203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66038 samples/s/p 0:33:28 } +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1706/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 5.8894364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65436 samples/s/p 0:33:27 } +2024-07-30 05:37:00,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1708/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 5.8731825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65893 samples/s/p 0:33:23 } +2024-07-30 05:37:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1710/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.856946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.66139 samples/s/p 0:33:19 } +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1712/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.8407306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:06,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65804 samples/s/p 0:33:17 } +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1714/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.824533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.66031 samples/s/p 0:33:14 } +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1716/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 5.8083623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:11,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65470 samples/s/p 0:33:13 } +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1718/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 5.792209e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:14,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65572 samples/s/p 0:33:10 } +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1720/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.7760803e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65895 samples/s/p 0:33:06 } +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1722/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 5.759972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65729 samples/s/p 0:33:03 } +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1724/ 3125], loss: 0.136, per_step_time: 1414ms, lr: 5.7438876e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65431 samples/s/p 0:33:02 } +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1726/ 3125], loss: 0.655, per_step_time: 1415ms, lr: 5.7278123e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65309 samples/s/p 0:32:59 } +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1728/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.71177e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:28,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66083 samples/s/p 0:32:54 } +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1730/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6957424e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66074 samples/s/p 0:32:51 } +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1732/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6797353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:34,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66029 samples/s/p 0:32:48 } +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1734/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.6637555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66059 samples/s/p 0:32:45 } +2024-07-30 05:37:40,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1736/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 5.647793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:40,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66104 samples/s/p 0:32:42 } +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1738/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.631855e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:42,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66113 samples/s/p 0:32:40 } +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1740/ 3125], loss: 0.575, per_step_time: 1412ms, lr: 5.6159377e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66259 samples/s/p 0:32:36 } +2024-07-30 05:37:48,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1742/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.600035e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:48,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66054 samples/s/p 0:32:34 } +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1744/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.5841593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66151 samples/s/p 0:32:31 } +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1746/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 5.5683046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66329 samples/s/p 0:32:27 } +2024-07-30 05:37:57,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1748/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 5.5524737e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:57,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66010 samples/s/p 0:32:26 } +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 5.536655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.65573 samples/s/p 0:32:24 } +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1752/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 5.5208653e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:02,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66142 samples/s/p 0:32:20 } +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1754/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 5.505097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66249 samples/s/p 0:32:16 } +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1756/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.4893405e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65877 samples/s/p 0:32:15 } +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1758/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4736165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66008 samples/s/p 0:32:12 } +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1760/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.457908e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66105 samples/s/p 0:32:08 } +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1762/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.442223e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65775 samples/s/p 0:32:07 } +2024-07-30 05:38:19,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1764/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.4265615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:19,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66097 samples/s/p 0:32:03 } +2024-07-30 05:38:22,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1766/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 5.4109216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:22,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66005 samples/s/p 0:32:00 } +2024-07-30 05:38:25,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1768/ 3125], loss: 0.316, per_step_time: 1412ms, lr: 5.395296e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66240 samples/s/p 0:31:57 } +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1770/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 5.379692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66096 samples/s/p 0:31:54 } +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1772/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.364117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:31,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66020 samples/s/p 0:31:52 } +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1774/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.3485513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66011 samples/s/p 0:31:49 } +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1776/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.333021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66098 samples/s/p 0:31:46 } +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1778/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 5.317503e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65924 samples/s/p 0:31:44 } +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1780/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 5.302012e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:42,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65725 samples/s/p 0:31:41 } +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1782/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 5.2865414e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65390 samples/s/p 0:31:40 } +2024-07-30 05:38:48,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1784/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 5.271089e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65999 samples/s/p 0:31:35 } +2024-07-30 05:38:50,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1786/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 5.2556544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:50,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66269 samples/s/p 0:31:31 } +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1788/ 3125], loss: 0.179, per_step_time: 1415ms, lr: 5.240249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65288 samples/s/p 0:31:32 } +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1790/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 5.2248623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66099 samples/s/p 0:31:26 } +2024-07-30 05:38:59,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1792/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 5.2094964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:59,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65992 samples/s/p 0:31:24 } +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1794/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 5.194148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65918 samples/s/p 0:31:21 } +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1796/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 5.178827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65758 samples/s/p 0:31:19 } +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1798/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.1635266e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:07,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66075 samples/s/p 0:31:15 } +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1800/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 5.1482436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.66102 samples/s/p 0:31:12 } +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1802/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 5.132985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65763 samples/s/p 0:31:10 } +2024-07-30 05:39:16,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1804/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 5.11775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:16,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.66052 samples/s/p 0:31:06 } +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1806/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.102533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65518 samples/s/p 0:31:05 } +2024-07-30 05:39:22,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1808/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.08734e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:22,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65780 samples/s/p 0:31:02 } +2024-07-30 05:39:24,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1810/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.072167e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:24,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.66142 samples/s/p 0:30:58 } +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1812/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.057019e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:27,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65941 samples/s/p 0:30:56 } +2024-07-30 05:39:30,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1814/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 5.0418885e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:30,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65535 samples/s/p 0:30:54 } +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1816/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 5.0267784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65737 samples/s/p 0:30:51 } +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1818/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 5.0116836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65594 samples/s/p 0:30:48 } +2024-07-30 05:39:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1820/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 4.996621e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:39,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65224 samples/s/p 0:30:47 } +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1822/ 3125], loss: 0.149, per_step_time: 1414ms, lr: 4.981577e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65437 samples/s/p 0:30:43 } +2024-07-30 05:39:44,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1824/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.966557e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:44,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65603 samples/s/p 0:30:40 } +2024-07-30 05:39:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1826/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 4.9515575e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:47,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65653 samples/s/p 0:30:37 } +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1828/ 3125], loss: 0.129, per_step_time: 1415ms, lr: 4.936573e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.64974 samples/s/p 0:30:36 } +2024-07-30 05:39:53,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1830/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 4.921615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:53,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65546 samples/s/p 0:30:31 } +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1832/ 3125], loss: 0.366, per_step_time: 1415ms, lr: 4.906681e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65291 samples/s/p 0:30:29 } +2024-07-30 05:39:58,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1834/ 3125], loss: 0.434, per_step_time: 1414ms, lr: 4.891765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:58,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65486 samples/s/p 0:30:26 } +2024-07-30 05:40:01,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1836/ 3125], loss: 0.215, per_step_time: 1415ms, lr: 4.8768726e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:01,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65324 samples/s/p 0:30:24 } +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1838/ 3125], loss: 0.347, per_step_time: 1416ms, lr: 4.8619955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.64918 samples/s/p 0:30:22 } +2024-07-30 05:40:07,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1840/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 4.847148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:07,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65391 samples/s/p 0:30:18 } +2024-07-30 05:40:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1842/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 4.8323153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65609 samples/s/p 0:30:14 } +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1844/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 4.8175065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65601 samples/s/p 0:30:11 } +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1846/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 4.802728e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66003 samples/s/p 0:30:07 } +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1848/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.7879604e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:18,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66071 samples/s/p 0:30:04 } +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1850/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7732203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66084 samples/s/p 0:30:01 } +2024-07-30 05:40:24,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1852/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 4.758501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:24,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.65947 samples/s/p 0:29:59 } +2024-07-30 05:40:27,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1854/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 4.7438024e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:27,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66147 samples/s/p 0:29:56 } +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1856/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.7291277e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.66125 samples/s/p 0:29:53 } +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1858/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.714465e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65762 samples/s/p 0:29:51 } +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1860/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 4.699832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:35,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65931 samples/s/p 0:29:48 } +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1862/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 4.685214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65829 samples/s/p 0:29:45 } +2024-07-30 05:40:41,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1864/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.670626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:41,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65942 samples/s/p 0:29:42 } +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1866/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 4.6560555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:44,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65668 samples/s/p 0:29:40 } +2024-07-30 05:40:47,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1868/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.641509e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:47,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65957 samples/s/p 0:29:36 } +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1870/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.6269832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65876 samples/s/p 0:29:34 } +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1872/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 4.6124725e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:52,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.66048 samples/s/p 0:29:30 } +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1874/ 3125], loss: 0.357, per_step_time: 1412ms, lr: 4.5979917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:55,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66229 samples/s/p 0:29:27 } +2024-07-30 05:40:58,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1876/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.5835316e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:58,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66071 samples/s/p 0:29:25 } +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1878/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 4.5690953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66161 samples/s/p 0:29:22 } +2024-07-30 05:41:04,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1880/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 4.554677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:04,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65870 samples/s/p 0:29:20 } +2024-07-30 05:41:07,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1882/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.5402763e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:07,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65963 samples/s/p 0:29:17 } +2024-07-30 05:41:09,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1884/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 4.5259057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:09,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65641 samples/s/p 0:29:15 } +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1886/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 4.51155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65485 samples/s/p 0:29:12 } +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1888/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.497218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65589 samples/s/p 0:29:09 } +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1890/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 4.482907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.66110 samples/s/p 0:29:05 } +2024-07-30 05:41:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1892/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 4.4686226e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:21,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.66016 samples/s/p 0:29:02 } +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1894/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 4.4543594e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65859 samples/s/p 0:29:00 } +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1896/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 4.440114e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65838 samples/s/p 0:28:57 } +2024-07-30 05:41:29,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1898/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.4258923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:29,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65987 samples/s/p 0:28:54 } +2024-07-30 05:41:32,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1900/ 3125], loss: 0.282, per_step_time: 1425ms, lr: 4.4116854e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:32,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.61334 samples/s/p 0:29:05 } +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1902/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 4.3975083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66130 samples/s/p 0:28:48 } +2024-07-30 05:41:38,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1904/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 4.3833552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:38,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.65965 samples/s/p 0:28:45 } +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1906/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.369217e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66130 samples/s/p 0:28:42 } +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1908/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.3550997e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:43,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66057 samples/s/p 0:28:39 } +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1910/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 4.3410122e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66264 samples/s/p 0:28:36 } +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1912/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.3269455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.65946 samples/s/p 0:28:34 } +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1914/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.3128907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66139 samples/s/p 0:28:31 } +2024-07-30 05:41:55,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1916/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 4.2988657e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66010 samples/s/p 0:28:28 } +2024-07-30 05:41:58,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1918/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 4.2848615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:58,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66167 samples/s/p 0:28:25 } +2024-07-30 05:42:00,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1920/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 4.2708783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:00,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66091 samples/s/p 0:28:22 } +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1922/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 4.2569218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66111 samples/s/p 0:28:20 } +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1924/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 4.2429835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65963 samples/s/p 0:28:17 } +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1926/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.2290628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65859 samples/s/p 0:28:15 } +2024-07-30 05:42:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1928/ 3125], loss: 0.454, per_step_time: 1412ms, lr: 4.215169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:12,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66186 samples/s/p 0:28:11 } +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1930/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 4.20129e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66256 samples/s/p 0:28:08 } +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1932/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.1874407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66168 samples/s/p 0:28:05 } +2024-07-30 05:42:20,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1934/ 3125], loss: 0.110, per_step_time: 1414ms, lr: 4.1736124e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:20,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65743 samples/s/p 0:28:04 } +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1936/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 4.159802e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65801 samples/s/p 0:28:01 } +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1938/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 4.1460186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65825 samples/s/p 0:27:58 } +2024-07-30 05:42:29,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1940/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 4.132256e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66134 samples/s/p 0:27:54 } +2024-07-30 05:42:32,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1942/ 3125], loss: 0.137, per_step_time: 1415ms, lr: 4.118514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:32,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65184 samples/s/p 0:27:54 } +2024-07-30 05:42:34,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1944/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 4.10479e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:34,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65746 samples/s/p 0:27:50 } +2024-07-30 05:42:37,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1946/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.091096e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:37,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65970 samples/s/p 0:27:46 } +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1948/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.0774196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66029 samples/s/p 0:27:43 } +2024-07-30 05:42:43,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1950/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 4.063761e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65844 samples/s/p 0:27:41 } +2024-07-30 05:42:46,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1952/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.0501297e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:46,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65951 samples/s/p 0:27:38 } +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1954/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 4.0365188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66116 samples/s/p 0:27:34 } +2024-07-30 05:42:51,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1956/ 3125], loss: 0.320, per_step_time: 1412ms, lr: 4.0229318e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:51,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66203 samples/s/p 0:27:31 } +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1958/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 4.00936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66258 samples/s/p 0:27:28 } +2024-07-30 05:42:57,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1960/ 3125], loss: 0.147, per_step_time: 1418ms, lr: 3.995821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:57,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.63819 samples/s/p 0:27:33 } +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1962/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.9822964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66026 samples/s/p 0:27:23 } +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1964/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 3.968799e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66325 samples/s/p 0:27:20 } +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1966/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.9553166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66009 samples/s/p 0:27:18 } +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1968/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 3.9418606e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65997 samples/s/p 0:27:15 } +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1970/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.9284288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65876 samples/s/p 0:27:12 } +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1972/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 3.9150117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65924 samples/s/p 0:27:09 } +2024-07-30 05:43:17,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1974/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.9016186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:17,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65237 samples/s/p 0:27:09 } +2024-07-30 05:43:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1976/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 3.888252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.66129 samples/s/p 0:27:03 } +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1978/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 3.874904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:23,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66015 samples/s/p 0:27:01 } +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1980/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.8615792e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:25,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66158 samples/s/p 0:26:57 } +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1982/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 3.8482784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65953 samples/s/p 0:26:55 } +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1984/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 3.8349955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65992 samples/s/p 0:26:52 } +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1986/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 3.8217425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.64757 samples/s/p 0:26:53 } +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1988/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.8085014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:37,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66092 samples/s/p 0:26:46 } +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1990/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 3.795287e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65416 samples/s/p 0:26:45 } +2024-07-30 05:43:42,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1992/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 3.7820934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:42,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66208 samples/s/p 0:26:40 } +2024-07-30 05:43:45,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1994/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7689267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66094 samples/s/p 0:26:38 } +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1996/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 3.755772e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65712 samples/s/p 0:26:36 } +2024-07-30 05:43:51,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1998/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 3.7426472e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:51,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65787 samples/s/p 0:26:33 } +2024-07-30 05:43:54,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2000/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.729546e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:54,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65750 samples/s/p 0:26:30 } +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2002/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7164597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65726 samples/s/p 0:26:28 } +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2004/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7034005e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.66094 samples/s/p 0:26:24 } +2024-07-30 05:44:02,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2006/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.690362e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:02,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65933 samples/s/p 0:26:21 } +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2008/ 3125], loss: 0.410, per_step_time: 1412ms, lr: 3.677347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66224 samples/s/p 0:26:18 } +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2010/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 3.6643564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66120 samples/s/p 0:26:15 } +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2012/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.6513865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65787 samples/s/p 0:26:13 } +2024-07-30 05:44:14,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2014/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.6384372e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:14,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66033 samples/s/p 0:26:10 } +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2016/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 3.625506e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66250 samples/s/p 0:26:06 } +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2018/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.6126016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.65969 samples/s/p 0:26:04 } +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2020/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 3.599718e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66091 samples/s/p 0:26:01 } +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2022/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 3.5868555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:25,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66111 samples/s/p 0:25:58 } +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2024/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 3.5740166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:28,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66166 samples/s/p 0:25:55 } +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2026/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.5612015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66085 samples/s/p 0:25:53 } +2024-07-30 05:44:33,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2028/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.5484044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:33,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65889 samples/s/p 0:25:50 } +2024-07-30 05:44:36,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2030/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.535631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66082 samples/s/p 0:25:47 } +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2032/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 3.5228848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66012 samples/s/p 0:25:44 } +2024-07-30 05:44:42,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2034/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.5101561e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:42,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66060 samples/s/p 0:25:41 } +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2036/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.4974514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:45,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66030 samples/s/p 0:25:39 } +2024-07-30 05:44:48,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2038/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.4847704e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:48,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66045 samples/s/p 0:25:36 } +2024-07-30 05:44:50,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2040/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.4721046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:50,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65945 samples/s/p 0:25:33 } +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2042/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 3.4594655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65667 samples/s/p 0:25:31 } +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2044/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 3.446847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65749 samples/s/p 0:25:28 } +2024-07-30 05:44:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2046/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 3.4342526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65646 samples/s/p 0:25:26 } +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2048/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 3.421682e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:02,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.66199 samples/s/p 0:25:21 } +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2050/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 3.4091323e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65968 samples/s/p 0:25:19 } +2024-07-30 05:45:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2052/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.3966063e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:07,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65972 samples/s/p 0:25:16 } +2024-07-30 05:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2054/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 3.3841013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65907 samples/s/p 0:25:14 } +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2056/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.3716202e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.66042 samples/s/p 0:25:10 } +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2058/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 3.3591598e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65736 samples/s/p 0:25:08 } +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2060/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 3.3467143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65905 samples/s/p 0:25:05 } +2024-07-30 05:45:22,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2062/ 3125], loss: 0.276, per_step_time: 1418ms, lr: 3.3342985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:22,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64113 samples/s/p 0:25:07 } +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2064/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 3.321907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:24,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66144 samples/s/p 0:24:59 } +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2066/ 3125], loss: 0.146, per_step_time: 1412ms, lr: 3.30953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66245 samples/s/p 0:24:56 } +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2068/ 3125], loss: 0.238, per_step_time: 1417ms, lr: 3.297183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64299 samples/s/p 0:24:58 } +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2070/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 3.2848595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66057 samples/s/p 0:24:51 } +2024-07-30 05:45:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 3.272554e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:36,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65781 samples/s/p 0:24:48 } +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2074/ 3125], loss: 0.392, per_step_time: 1415ms, lr: 3.2602668e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65081 samples/s/p 0:24:47 } +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2076/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 3.248009e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65741 samples/s/p 0:24:43 } +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2078/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2357693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65828 samples/s/p 0:24:40 } +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2080/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 3.2235562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66164 samples/s/p 0:24:36 } +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2082/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.211364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66118 samples/s/p 0:24:33 } +2024-07-30 05:45:53,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2084/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 3.19919e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:53,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65879 samples/s/p 0:24:31 } +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2086/ 3125], loss: 0.434, per_step_time: 1412ms, lr: 3.1870425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66290 samples/s/p 0:24:27 } +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2088/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 3.17491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:58,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66027 samples/s/p 0:24:25 } +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2090/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 3.1628102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66259 samples/s/p 0:24:22 } +2024-07-30 05:46:04,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2092/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1507284e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:04,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65814 samples/s/p 0:24:20 } +2024-07-30 05:46:07,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2094/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.1386702e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65870 samples/s/p 0:24:17 } +2024-07-30 05:46:10,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.126633e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:10,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66166 samples/s/p 0:24:13 } +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2098/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1146197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66010 samples/s/p 0:24:11 } +2024-07-30 05:46:15,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2100/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 3.1026272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:15,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65592 samples/s/p 0:24:09 } +2024-07-30 05:46:18,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2102/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 3.0906529e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:18,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65801 samples/s/p 0:24:06 } +2024-07-30 05:46:21,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2104/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.078708e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:21,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65939 samples/s/p 0:24:03 } +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2106/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.066784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.66090 samples/s/p 0:24:00 } +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2108/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 3.0548782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65869 samples/s/p 0:23:57 } +2024-07-30 05:46:30,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2110/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.0429987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:30,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66057 samples/s/p 0:23:54 } +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2112/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.0311435e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65896 samples/s/p 0:23:52 } +2024-07-30 05:46:35,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2114/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.019309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:35,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65971 samples/s/p 0:23:49 } +2024-07-30 05:46:38,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2116/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 3.0074892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:38,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66113 samples/s/p 0:23:45 } +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2118/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.9957056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65960 samples/s/p 0:23:43 } +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2120/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 2.9839336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65629 samples/s/p 0:23:41 } +2024-07-30 05:46:47,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2122/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.9721915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:47,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65973 samples/s/p 0:23:37 } +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2124/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 2.9604672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66281 samples/s/p 0:23:34 } +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2126/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.94877e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66106 samples/s/p 0:23:31 } +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2128/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 2.9370904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66066 samples/s/p 0:23:29 } +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2130/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 2.9254346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66181 samples/s/p 0:23:25 } +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2132/ 3125], loss: 0.417, per_step_time: 1414ms, lr: 2.9138e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65754 samples/s/p 0:23:24 } +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2134/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 2.9021888e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:04,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65868 samples/s/p 0:23:21 } +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2136/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.8905987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65970 samples/s/p 0:23:17 } +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2138/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 2.8790353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65996 samples/s/p 0:23:15 } +2024-07-30 05:47:12,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2140/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 2.8674899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65791 samples/s/p 0:23:12 } +2024-07-30 05:47:15,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2142/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 2.8559742e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:15,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65814 samples/s/p 0:23:09 } +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2144/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.8444765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:18,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65786 samples/s/p 0:23:07 } +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 2.8329998e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:21,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65980 samples/s/p 0:23:03 } +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2148/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 2.8215436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65912 samples/s/p 0:23:01 } +2024-07-30 05:47:26,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2150/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.8101147e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66032 samples/s/p 0:22:58 } +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2152/ 3125], loss: 0.418, per_step_time: 3103ms, lr: 2.7987033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 2.57747 samples/s/p 0:50:20 } +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2154/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.7873187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66137 samples/s/p 0:22:52 } +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2156/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 2.7759552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65921 samples/s/p 0:22:49 } +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2158/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 2.7646155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65987 samples/s/p 0:22:46 } +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2160/ 3125], loss: 0.600, per_step_time: 1413ms, lr: 2.7532965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65857 samples/s/p 0:22:44 } +2024-07-30 05:48:17,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2162/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.7420015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:17,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65854 samples/s/p 0:22:41 } +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2164/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 2.7307271e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65626 samples/s/p 0:22:39 } +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2166/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.7194767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.66046 samples/s/p 0:22:35 } +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2168/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 2.7082532e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65551 samples/s/p 0:22:33 } +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2170/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6970474e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65727 samples/s/p 0:22:30 } +2024-07-30 05:48:31,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2172/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 2.6858626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:31,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65755 samples/s/p 0:22:27 } +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2174/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 2.6747017e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:34,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66105 samples/s/p 0:22:23 } +2024-07-30 05:48:37,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2176/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 2.6635615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:37,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66173 samples/s/p 0:22:20 } +2024-07-30 05:48:40,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2178/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.6524512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:40,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65977 samples/s/p 0:22:18 } +2024-07-30 05:48:42,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2180/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.641356e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:42,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65936 samples/s/p 0:22:15 } +2024-07-30 05:48:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2182/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.6302874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65984 samples/s/p 0:22:12 } +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2184/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 2.6192455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:48,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65806 samples/s/p 0:22:10 } +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2186/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 2.6082188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.66094 samples/s/p 0:22:06 } +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2188/ 3125], loss: 0.160, per_step_time: 1415ms, lr: 2.5972128e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65264 samples/s/p 0:22:06 } +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2190/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 2.5862366e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.66085 samples/s/p 0:22:01 } +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2192/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 2.5752811e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:59,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.66135 samples/s/p 0:21:58 } +2024-07-30 05:49:02,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2194/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 2.5643467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:02,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66096 samples/s/p 0:21:55 } +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2196/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 2.553433e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:05,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66201 samples/s/p 0:21:52 } +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2198/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 2.5425493e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65602 samples/s/p 0:21:51 } +2024-07-30 05:49:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2200/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.5316834e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65700 samples/s/p 0:21:48 } +2024-07-30 05:49:14,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2202/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.5208382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65942 samples/s/p 0:21:44 } +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2204/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 2.5100172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65715 samples/s/p 0:21:42 } +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.4992198e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66154 samples/s/p 0:21:38 } +2024-07-30 05:49:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2208/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 2.4884463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:22,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65994 samples/s/p 0:21:36 } +2024-07-30 05:49:25,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2210/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.4776935e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:25,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65974 samples/s/p 0:21:33 } +2024-07-30 05:49:28,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2212/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.4669646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:28,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65925 samples/s/p 0:21:30 } +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2214/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4562596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65858 samples/s/p 0:21:27 } +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2216/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 2.4455724e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65671 samples/s/p 0:21:25 } +2024-07-30 05:49:36,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2218/ 3125], loss: 0.370, per_step_time: 1415ms, lr: 2.4349092e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:36,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65313 samples/s/p 0:21:23 } +2024-07-30 05:49:39,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2220/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 2.424267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:39,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.66178 samples/s/p 0:21:18 } +2024-07-30 05:49:42,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2222/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.4136511e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:42,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65527 samples/s/p 0:21:17 } +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2224/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 2.4030626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:45,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66275 samples/s/p 0:21:12 } +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2226/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3924918e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66087 samples/s/p 0:21:10 } +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2228/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 2.3819446e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:50,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66029 samples/s/p 0:21:07 } +2024-07-30 05:49:53,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2230/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.3714185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:53,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66346 samples/s/p 0:21:04 } +2024-07-30 05:49:56,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2232/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 2.3609131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:56,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66105 samples/s/p 0:21:01 } +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2234/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 2.3504346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66281 samples/s/p 0:20:58 } +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2236/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 2.339977e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:02,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66307 samples/s/p 0:20:55 } +2024-07-30 05:50:05,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2238/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 2.3295432e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.65740 samples/s/p 0:20:54 } +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2240/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 2.3191302e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66026 samples/s/p 0:20:50 } +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2242/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.3087412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65950 samples/s/p 0:20:48 } +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2244/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.298379e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65962 samples/s/p 0:20:45 } +2024-07-30 05:50:16,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2246/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 2.2880344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:16,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66022 samples/s/p 0:20:42 } +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2248/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.277714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:19,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65992 samples/s/p 0:20:39 } +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2250/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.2674172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.66015 samples/s/p 0:20:36 } +2024-07-30 05:50:24,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2252/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 2.2571385e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:24,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65763 samples/s/p 0:20:34 } +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2254/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.2468895e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65926 samples/s/p 0:20:31 } +2024-07-30 05:50:30,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2256/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 2.2366582e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:30,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.66102 samples/s/p 0:20:28 } +2024-07-30 05:50:33,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2258/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.226451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:33,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65757 samples/s/p 0:20:25 } +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2260/ 3125], loss: 0.350, per_step_time: 1414ms, lr: 2.2162705e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65650 samples/s/p 0:20:23 } +2024-07-30 05:50:39,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2262/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 2.2061108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:39,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65874 samples/s/p 0:20:20 } +2024-07-30 05:50:41,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2264/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.1959691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:41,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66142 samples/s/p 0:20:16 } +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2266/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.1858513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66132 samples/s/p 0:20:13 } +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2268/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 2.1757631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:47,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65863 samples/s/p 0:20:11 } +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2270/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 2.165693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.66126 samples/s/p 0:20:08 } +2024-07-30 05:50:53,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2272/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 2.1556467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:53,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65609 samples/s/p 0:20:06 } +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2274/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.145627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65892 samples/s/p 0:20:03 } +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2276/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.1356195e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65790 samples/s/p 0:20:00 } +2024-07-30 05:51:01,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2278/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 2.1256416e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:01,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65789 samples/s/p 0:19:57 } +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2280/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 2.1156906e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:04,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65566 samples/s/p 0:19:55 } +2024-07-30 05:51:07,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2282/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.1057605e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:07,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65337 samples/s/p 0:19:52 } +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2284/ 3125], loss: 0.233, per_step_time: 1415ms, lr: 2.0958453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65252 samples/s/p 0:19:50 } +2024-07-30 05:51:13,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2286/ 3125], loss: 0.250, per_step_time: 1414ms, lr: 2.0859599e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:13,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65499 samples/s/p 0:19:46 } +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2288/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.0760953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65812 samples/s/p 0:19:43 } +2024-07-30 05:51:18,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2290/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.0662516e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:18,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65912 samples/s/p 0:19:40 } +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2292/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 2.0564347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65807 samples/s/p 0:19:37 } +2024-07-30 05:51:24,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2294/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 2.0466386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:24,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.66254 samples/s/p 0:19:34 } +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2296/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.0368695e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.64976 samples/s/p 0:19:33 } +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2298/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 2.0271182e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66225 samples/s/p 0:19:28 } +2024-07-30 05:51:32,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2300/ 3125], loss: 0.330, per_step_time: 1412ms, lr: 2.0173967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:32,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66191 samples/s/p 0:19:25 } +2024-07-30 05:51:35,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2302/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.007693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.65937 samples/s/p 0:19:23 } +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2304/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 1.9980102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66083 samples/s/p 0:19:20 } +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2306/ 3125], loss: 0.122, per_step_time: 1412ms, lr: 1.9883512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66175 samples/s/p 0:19:17 } +2024-07-30 05:51:44,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2308/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 1.9787161e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66215 samples/s/p 0:19:14 } +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2310/ 3125], loss: 0.457, per_step_time: 1412ms, lr: 1.969102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:47,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66218 samples/s/p 0:19:11 } +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2312/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 1.9595146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66045 samples/s/p 0:19:09 } +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2314/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.949951e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66153 samples/s/p 0:19:05 } +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2316/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.9404054e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.66159 samples/s/p 0:19:03 } +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2318/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.9308835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65828 samples/s/p 0:19:00 } +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2320/ 3125], loss: 0.210, per_step_time: 1414ms, lr: 1.9213884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65739 samples/s/p 0:18:58 } +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2322/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.9119173e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65527 samples/s/p 0:18:55 } +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2324/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.902464e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65967 samples/s/p 0:18:52 } +2024-07-30 05:52:09,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2326/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.8930375e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:09,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66079 samples/s/p 0:18:49 } +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2328/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 1.8836319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:12,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65959 samples/s/p 0:18:46 } +2024-07-30 05:52:15,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2330/ 3125], loss: 0.352, per_step_time: 1412ms, lr: 1.8742502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:15,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66279 samples/s/p 0:18:43 } +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2332/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.8648892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65862 samples/s/p 0:18:41 } +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2334/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.8555491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:21,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65875 samples/s/p 0:18:38 } +2024-07-30 05:52:23,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2336/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.8462389e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:23,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65961 samples/s/p 0:18:35 } +2024-07-30 05:52:26,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2338/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 1.8369495e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:26,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65781 samples/s/p 0:18:32 } +2024-07-30 05:52:29,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2340/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 1.827684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:29,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.66097 samples/s/p 0:18:29 } +2024-07-30 05:52:32,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2342/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 1.8184393e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:32,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65508 samples/s/p 0:18:27 } +2024-07-30 05:52:35,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2344/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.8092155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65920 samples/s/p 0:18:24 } +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2346/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 1.8000215e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65992 samples/s/p 0:18:21 } +2024-07-30 05:52:40,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2348/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 1.7908394e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:40,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65711 samples/s/p 0:18:18 } +2024-07-30 05:52:43,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2350/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 1.78169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:43,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65754 samples/s/p 0:18:15 } +2024-07-30 05:52:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2352/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.7725617e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65937 samples/s/p 0:18:12 } +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2354/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 1.7634571e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.66054 samples/s/p 0:18:09 } +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2356/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.7543672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:52,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65897 samples/s/p 0:18:07 } +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2358/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.7453104e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:55,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65771 samples/s/p 0:18:04 } +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2360/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.7362743e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65772 samples/s/p 0:18:01 } +2024-07-30 05:53:00,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2362/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 1.7272562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:00,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65689 samples/s/p 0:17:59 } +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2364/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 1.7182677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65902 samples/s/p 0:17:55 } +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2366/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.7093032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65901 samples/s/p 0:17:52 } +2024-07-30 05:53:09,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2368/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7003566e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:09,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65990 samples/s/p 0:17:49 } +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2370/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 1.6914368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:12,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66257 samples/s/p 0:17:46 } +2024-07-30 05:53:14,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2372/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6825408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:14,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.66121 samples/s/p 0:17:44 } +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2374/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.6736627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:17,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.65983 samples/s/p 0:17:41 } +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2376/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.6648083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.66270 samples/s/p 0:17:38 } +2024-07-30 05:53:23,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2378/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.655975e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:23,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.65960 samples/s/p 0:17:35 } +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2380/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 1.6471714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66091 samples/s/p 0:17:32 } +2024-07-30 05:53:29,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2382/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.6383856e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:29,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66089 samples/s/p 0:17:30 } +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2384/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.6296268e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:31,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66010 samples/s/p 0:17:27 } +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2386/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.6208917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66006 samples/s/p 0:17:24 } +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2388/ 3125], loss: 0.043, per_step_time: 1413ms, lr: 1.6121744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:37,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65888 samples/s/p 0:17:21 } +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2390/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 1.603484e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.66044 samples/s/p 0:17:18 } +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2392/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.5948176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:43,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65534 samples/s/p 0:17:16 } +2024-07-30 05:53:46,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2394/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 1.586169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:46,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65850 samples/s/p 0:17:13 } +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2396/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.5775501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65935 samples/s/p 0:17:10 } +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2398/ 3125], loss: 0.399, per_step_time: 1414ms, lr: 1.5689491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:51,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65694 samples/s/p 0:17:08 } +2024-07-30 05:53:54,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2400/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.560378e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:54,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.66094 samples/s/p 0:17:04 } +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2402/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 1.5518218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.66003 samples/s/p 0:17:01 } +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2404/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 1.5432924e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65758 samples/s/p 0:16:59 } +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2406/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.5347868e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65782 samples/s/p 0:16:56 } +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2408/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.5263021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65397 samples/s/p 0:16:54 } +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2410/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 1.5178442e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65746 samples/s/p 0:16:51 } +2024-07-30 05:54:11,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2412/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.509407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:11,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65855 samples/s/p 0:16:48 } +2024-07-30 05:54:14,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2414/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 1.5009999e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:14,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65737 samples/s/p 0:16:45 } +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2416/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 1.4926076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.66064 samples/s/p 0:16:42 } +2024-07-30 05:54:20,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2418/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 1.4842361e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.65839 samples/s/p 0:16:39 } +2024-07-30 05:54:22,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2420/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4758915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66060 samples/s/p 0:16:36 } +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2422/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.4675706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66096 samples/s/p 0:16:33 } +2024-07-30 05:54:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2424/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4592736e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:28,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66086 samples/s/p 0:16:30 } +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2426/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.4509976e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66030 samples/s/p 0:16:27 } +2024-07-30 05:54:34,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2428/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 1.4427512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:34,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66012 samples/s/p 0:16:25 } +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2430/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.4345228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:37,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66215 samples/s/p 0:16:21 } +2024-07-30 05:54:39,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2432/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.4263212e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.65947 samples/s/p 0:16:19 } +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2434/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 1.4181346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66082 samples/s/p 0:16:16 } +2024-07-30 05:54:45,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2436/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4099747e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65964 samples/s/p 0:16:13 } +2024-07-30 05:54:48,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2438/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.4018386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:48,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65973 samples/s/p 0:16:11 } +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2440/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.3937324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66064 samples/s/p 0:16:08 } +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2442/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.385638e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66002 samples/s/p 0:16:05 } +2024-07-30 05:54:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2444/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.3775735e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65889 samples/s/p 0:16:02 } +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2446/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.3695359e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.66112 samples/s/p 0:15:59 } +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2448/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 1.3615131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:02,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65690 samples/s/p 0:15:57 } +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2450/ 3125], loss: 0.194, per_step_time: 1418ms, lr: 1.3535141e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.64029 samples/s/p 0:15:57 } +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2452/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.345545e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65961 samples/s/p 0:15:51 } +2024-07-30 05:55:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2454/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 1.3375967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:11,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65875 samples/s/p 0:15:48 } +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2456/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 1.3296693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65687 samples/s/p 0:15:46 } +2024-07-30 05:55:16,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2458/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 1.3217628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:16,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65264 samples/s/p 0:15:43 } +2024-07-30 05:55:19,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2460/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.313889e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:19,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66092 samples/s/p 0:15:39 } +2024-07-30 05:55:22,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2462/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 1.3060301e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66155 samples/s/p 0:15:36 } +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2464/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.2981981e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66059 samples/s/p 0:15:34 } +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2466/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 1.290381e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65747 samples/s/p 0:15:31 } +2024-07-30 05:55:31,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2468/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.2825936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:31,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66096 samples/s/p 0:15:28 } +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2470/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.274833e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65996 samples/s/p 0:15:25 } +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2472/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 1.2670934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:36,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65556 samples/s/p 0:15:23 } +2024-07-30 05:55:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2474/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 1.2593746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65957 samples/s/p 0:15:20 } +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2476/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 1.2516796e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:42,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65753 samples/s/p 0:15:17 } +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2478/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 1.2440115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66067 samples/s/p 0:15:14 } +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2480/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 1.2363672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:48,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65823 samples/s/p 0:15:11 } +2024-07-30 05:55:50,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2482/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.2287408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:50,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66072 samples/s/p 0:15:08 } +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2484/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.2211382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:53,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66141 samples/s/p 0:15:05 } +2024-07-30 05:55:56,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2486/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 1.2135625e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:56,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65845 samples/s/p 0:15:03 } +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2488/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 1.2060076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66113 samples/s/p 0:15:00 } +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2490/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 1.1984795e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66191 samples/s/p 0:14:57 } +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2492/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 1.1909723e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65965 samples/s/p 0:14:54 } +2024-07-30 05:56:07,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2494/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 1.18348595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:07,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.66054 samples/s/p 0:14:51 } +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2496/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 1.1760235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.66005 samples/s/p 0:14:49 } +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2498/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 1.1685848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:13,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65892 samples/s/p 0:14:46 } +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2500/ 3125], loss: 0.334, per_step_time: 1414ms, lr: 1.1611759e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65657 samples/s/p 0:14:43 } +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2502/ 3125], loss: 0.413, per_step_time: 1415ms, lr: 1.153782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.65292 samples/s/p 0:14:41 } +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2504/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 1.14641786e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66051 samples/s/p 0:14:37 } +2024-07-30 05:56:24,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2506/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 1.13907156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:24,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66197 samples/s/p 0:14:34 } +2024-07-30 05:56:27,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2508/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.1317521e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:27,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66116 samples/s/p 0:14:31 } +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2510/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 1.1244505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66059 samples/s/p 0:14:29 } +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2512/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.11717874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65499 samples/s/p 0:14:27 } +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2514/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.1099249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:36,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65959 samples/s/p 0:14:23 } +2024-07-30 05:56:39,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2516/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 1.1027008e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65706 samples/s/p 0:14:21 } +2024-07-30 05:56:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2518/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 1.0954946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:41,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65332 samples/s/p 0:14:18 } +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2520/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 1.0883152e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:44,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.66157 samples/s/p 0:14:14 } +2024-07-30 05:56:47,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2522/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.0811567e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:47,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66136 samples/s/p 0:14:12 } +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2524/ 3125], loss: 0.348, per_step_time: 1412ms, lr: 1.074025e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:50,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66200 samples/s/p 0:14:09 } +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2526/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.0669142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:53,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66130 samples/s/p 0:14:06 } +2024-07-30 05:56:56,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2528/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.0598272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65985 samples/s/p 0:14:03 } +2024-07-30 05:56:58,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2530/ 3125], loss: 0.130, per_step_time: 1412ms, lr: 1.0527551e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:58,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66228 samples/s/p 0:14:00 } +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2532/ 3125], loss: 0.062, per_step_time: 1413ms, lr: 1.04571576e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:01,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66165 samples/s/p 0:13:57 } +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2534/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 1.0387033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66169 samples/s/p 0:13:55 } +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2536/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 1.0317057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:07,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66233 samples/s/p 0:13:52 } +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2538/ 3125], loss: 0.071, per_step_time: 1415ms, lr: 1.0247349e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:10,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65336 samples/s/p 0:13:50 } +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2540/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.017788e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65889 samples/s/p 0:13:47 } +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2542/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.0108679e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65540 samples/s/p 0:13:44 } +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2544/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 1.0039687e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65785 samples/s/p 0:13:41 } +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2546/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 9.9709034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.66331 samples/s/p 0:13:37 } +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2548/ 3125], loss: 0.436, per_step_time: 1414ms, lr: 9.902358e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65702 samples/s/p 0:13:35 } +2024-07-30 05:57:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2550/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.834021e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:27,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66128 samples/s/p 0:13:32 } +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2552/ 3125], loss: 0.283, per_step_time: 1414ms, lr: 9.765982e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:30,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.65742 samples/s/p 0:13:30 } +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2554/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.6981225e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:32,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66113 samples/s/p 0:13:26 } +2024-07-30 05:57:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2556/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.630531e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66093 samples/s/p 0:13:24 } +2024-07-30 05:57:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2558/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.5631776e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.66018 samples/s/p 0:13:21 } +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2560/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.4960626e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.66064 samples/s/p 0:13:18 } +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2562/ 3125], loss: 0.318, per_step_time: 1426ms, lr: 9.429186e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.60988 samples/s/p 0:13:22 } +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2564/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.362459e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.65913 samples/s/p 0:13:13 } +2024-07-30 05:57:49,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2566/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.29603e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:49,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.66046 samples/s/p 0:13:10 } +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2568/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.2298386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:52,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65580 samples/s/p 0:13:07 } +2024-07-30 05:57:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2570/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.163886e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.66156 samples/s/p 0:13:04 } +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2572/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 9.098202e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65549 samples/s/p 0:13:02 } +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2574/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.032637e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65852 samples/s/p 0:12:59 } +2024-07-30 05:58:04,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2576/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 8.9674295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:04,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65797 samples/s/p 0:12:56 } +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2578/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.9024006e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:06,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66104 samples/s/p 0:12:53 } +2024-07-30 05:58:09,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2580/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.83764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:09,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66149 samples/s/p 0:12:50 } +2024-07-30 05:58:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2582/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 8.7730584e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:12,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65977 samples/s/p 0:12:47 } +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2584/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.708715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65635 samples/s/p 0:12:45 } +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2586/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.64467e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66137 samples/s/p 0:12:41 } +2024-07-30 05:58:21,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2588/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.580774e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66043 samples/s/p 0:12:38 } +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2590/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 8.5171756e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66032 samples/s/p 0:12:36 } +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2592/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 8.453816e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:26,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66031 samples/s/p 0:12:33 } +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2594/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 8.390635e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65854 samples/s/p 0:12:30 } +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2596/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 8.327722e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65569 samples/s/p 0:12:28 } +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2598/ 3125], loss: 0.081, per_step_time: 1414ms, lr: 8.265048e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:35,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65703 samples/s/p 0:12:25 } +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2600/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 8.202642e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66186 samples/s/p 0:12:21 } +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2602/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.1404444e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66012 samples/s/p 0:12:19 } +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2604/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 8.078426e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66250 samples/s/p 0:12:16 } +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2606/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 8.0167055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66279 samples/s/p 0:12:13 } +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2608/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 7.955163e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.65726 samples/s/p 0:12:11 } +2024-07-30 05:58:52,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2610/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 7.893949e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:52,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66190 samples/s/p 0:12:07 } +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2612/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.8329144e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66028 samples/s/p 0:12:05 } +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2614/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.7721474e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:57,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66142 samples/s/p 0:12:02 } +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2616/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.7115295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:00,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66145 samples/s/p 0:11:59 } +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2618/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.6512094e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66036 samples/s/p 0:11:56 } +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2620/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.591128e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:06,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65880 samples/s/p 0:11:53 } +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2622/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 7.5312556e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66056 samples/s/p 0:11:50 } +2024-07-30 05:59:12,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2624/ 3125], loss: 0.343, per_step_time: 1425ms, lr: 7.47165e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:12,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.61230 samples/s/p 0:11:54 } +2024-07-30 05:59:14,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2626/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 7.4122546e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:14,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65778 samples/s/p 0:11:45 } +2024-07-30 05:59:17,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2628/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 7.353127e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:17,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65520 samples/s/p 0:11:43 } +2024-07-30 05:59:20,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2630/ 3125], loss: 0.312, per_step_time: 1412ms, lr: 7.294178e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:20,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66239 samples/s/p 0:11:39 } +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2632/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 7.235497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:23,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65979 samples/s/p 0:11:36 } +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2634/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 7.177055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65909 samples/s/p 0:11:34 } +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2636/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.118821e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65976 samples/s/p 0:11:31 } +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2638/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 7.0609154e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65988 samples/s/p 0:11:28 } +2024-07-30 05:59:34,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2640/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 7.003158e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:34,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65763 samples/s/p 0:11:25 } +2024-07-30 05:59:37,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2642/ 3125], loss: 0.435, per_step_time: 1414ms, lr: 6.94561e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:37,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65387 samples/s/p 0:11:23 } +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2644/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 6.8883594e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65836 samples/s/p 0:11:20 } +2024-07-30 05:59:43,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2646/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 6.831318e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66067 samples/s/p 0:11:16 } +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2648/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.774515e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66047 samples/s/p 0:11:14 } +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2650/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.71792e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65985 samples/s/p 0:11:11 } +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2652/ 3125], loss: 0.039, per_step_time: 1413ms, lr: 6.661624e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66108 samples/s/p 0:11:08 } +2024-07-30 05:59:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2654/ 3125], loss: 0.388, per_step_time: 1416ms, lr: 6.605536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:54,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.64670 samples/s/p 0:11:07 } +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2656/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 6.549686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66076 samples/s/p 0:11:02 } +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2658/ 3125], loss: 0.437, per_step_time: 1415ms, lr: 6.494045e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.65347 samples/s/p 0:11:00 } +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2660/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 6.4386725e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66195 samples/s/p 0:10:57 } +2024-07-30 06:00:05,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2662/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 6.383538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:05,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65956 samples/s/p 0:10:54 } +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2664/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 6.328612e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:08,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65920 samples/s/p 0:10:51 } +2024-07-30 06:00:11,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2666/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 6.273955e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66190 samples/s/p 0:10:48 } +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2668/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 6.2194765e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66064 samples/s/p 0:10:45 } +2024-07-30 06:00:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2670/ 3125], loss: 0.177, per_step_time: 1412ms, lr: 6.1652656e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:17,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66347 samples/s/p 0:10:42 } +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2672/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.111294e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65827 samples/s/p 0:10:40 } +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2674/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 6.05759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66238 samples/s/p 0:10:37 } +2024-07-30 06:00:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2676/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.0041245e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:25,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65954 samples/s/p 0:10:34 } +2024-07-30 06:00:28,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2678/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 5.950838e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:28,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65810 samples/s/p 0:10:32 } +2024-07-30 06:00:31,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2680/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.89779e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:31,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66040 samples/s/p 0:10:28 } +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2682/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 5.8449803e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65887 samples/s/p 0:10:26 } +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2684/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 5.792439e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:37,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65658 samples/s/p 0:10:23 } +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2686/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 5.7401657e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:39,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66180 samples/s/p 0:10:20 } +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2688/ 3125], loss: 0.657, per_step_time: 1413ms, lr: 5.6880115e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66010 samples/s/p 0:10:17 } +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2690/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 5.6361852e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.66070 samples/s/p 0:10:14 } +2024-07-30 06:00:48,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2692/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.5845973e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:48,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65646 samples/s/p 0:10:12 } +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2694/ 3125], loss: 0.072, per_step_time: 1414ms, lr: 5.5332183e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:51,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65452 samples/s/p 0:10:09 } +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2696/ 3125], loss: 0.481, per_step_time: 1414ms, lr: 5.4820475e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65411 samples/s/p 0:10:06 } +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2698/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 5.4311453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.66111 samples/s/p 0:10:03 } +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2700/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.3805113e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:59,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66104 samples/s/p 0:10:00 } +2024-07-30 06:01:02,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2702/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.3300855e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:02,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65962 samples/s/p 0:09:57 } +2024-07-30 06:01:05,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2704/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 5.2798686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:05,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65892 samples/s/p 0:09:55 } +2024-07-30 06:01:08,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2706/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.22992e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66000 samples/s/p 0:09:52 } +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2708/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 5.1802097e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65613 samples/s/p 0:09:49 } +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.1307378e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65952 samples/s/p 0:09:46 } +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2712/ 3125], loss: 0.024, per_step_time: 1413ms, lr: 5.081445e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65785 samples/s/p 0:09:43 } +2024-07-30 06:01:19,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2714/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 5.03242e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:19,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65387 samples/s/p 0:09:41 } +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2716/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 4.9836633e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65924 samples/s/p 0:09:38 } +2024-07-30 06:01:25,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2718/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 4.9351453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:25,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65589 samples/s/p 0:09:35 } +2024-07-30 06:01:28,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2720/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.886836e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:28,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65934 samples/s/p 0:09:32 } +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2722/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 4.8387644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65854 samples/s/p 0:09:29 } +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2724/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.790902e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65960 samples/s/p 0:09:26 } +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2726/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.7433375e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.66128 samples/s/p 0:09:23 } +2024-07-30 06:01:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2728/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.6959517e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66000 samples/s/p 0:09:21 } +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2730/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 4.6488342e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66067 samples/s/p 0:09:18 } +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2732/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 4.601985e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65897 samples/s/p 0:09:15 } +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2734/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 4.5553147e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:48,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65961 samples/s/p 0:09:12 } +2024-07-30 06:01:50,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2736/ 3125], loss: 0.227, per_step_time: 1412ms, lr: 4.5088825e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:50,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66172 samples/s/p 0:09:09 } +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2738/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 4.462689e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:53,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66091 samples/s/p 0:09:06 } +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2740/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 4.416764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:56,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66121 samples/s/p 0:09:04 } +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2742/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.3710767e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66042 samples/s/p 0:09:01 } +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2744/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.3255984e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.65943 samples/s/p 0:08:58 } +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2746/ 3125], loss: 0.068, per_step_time: 1412ms, lr: 4.2803883e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.66217 samples/s/p 0:08:55 } +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2748/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 4.2353868e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:07,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.65789 samples/s/p 0:08:53 } +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2750/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.1906535e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:10,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.66022 samples/s/p 0:08:50 } +2024-07-30 06:02:13,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2752/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 4.1461288e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:13,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65275 samples/s/p 0:08:47 } +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2754/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 4.1018424e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.66090 samples/s/p 0:08:44 } +2024-07-30 06:02:19,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2756/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 4.0577948e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:19,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65418 samples/s/p 0:08:42 } +2024-07-30 06:02:22,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2758/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 4.014015e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:22,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66158 samples/s/p 0:08:38 } +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2760/ 3125], loss: 0.477, per_step_time: 1414ms, lr: 3.9704442e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65597 samples/s/p 0:08:36 } +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2762/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 3.9270518e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:27,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66013 samples/s/p 0:08:33 } +2024-07-30 06:02:30,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2764/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.8839875e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:30,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66071 samples/s/p 0:08:30 } +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2766/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 3.841102e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66286 samples/s/p 0:08:27 } +2024-07-30 06:02:36,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2768/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 3.7985146e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:36,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66069 samples/s/p 0:08:24 } +2024-07-30 06:02:39,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2770/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.7561357e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:39,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66137 samples/s/p 0:08:21 } +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2772/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.7139653e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66067 samples/s/p 0:08:18 } +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2774/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 3.6720333e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:44,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66113 samples/s/p 0:08:16 } +2024-07-30 06:02:47,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2776/ 3125], loss: 0.407, per_step_time: 1412ms, lr: 3.63034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:47,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66232 samples/s/p 0:08:13 } +2024-07-30 06:02:50,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2778/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 3.5889446e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:50,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66065 samples/s/p 0:08:10 } +2024-07-30 06:02:53,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2780/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5476685e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:53,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66126 samples/s/p 0:08:07 } +2024-07-30 06:02:56,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2782/ 3125], loss: 0.459, per_step_time: 1413ms, lr: 3.5067497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:56,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66043 samples/s/p 0:08:04 } +2024-07-30 06:02:58,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2784/ 3125], loss: 0.311, per_step_time: 1416ms, lr: 3.46601e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:58,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.64942 samples/s/p 0:08:02 } +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2786/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.4255386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.66034 samples/s/p 0:07:59 } +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2788/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 3.3852753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:04,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65727 samples/s/p 0:07:56 } +2024-07-30 06:03:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2790/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 3.3452807e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:07,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65726 samples/s/p 0:07:53 } +2024-07-30 06:03:10,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2792/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.3054945e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65845 samples/s/p 0:07:50 } +2024-07-30 06:03:13,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2794/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.265947e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:13,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.66018 samples/s/p 0:07:47 } +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2796/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 3.226608e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65455 samples/s/p 0:07:45 } +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2798/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 3.187567e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65733 samples/s/p 0:07:42 } +2024-07-30 06:03:21,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2800/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 3.1487644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65805 samples/s/p 0:07:39 } +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2802/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 3.1101703e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65735 samples/s/p 0:07:36 } +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2804/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 3.071755e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:27,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66054 samples/s/p 0:07:33 } +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2806/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 3.033668e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66050 samples/s/p 0:07:30 } +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2808/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 2.995759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:32,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65658 samples/s/p 0:07:28 } +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2810/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 2.9581486e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66255 samples/s/p 0:07:25 } +2024-07-30 06:03:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2812/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 2.920717e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66071 samples/s/p 0:07:22 } +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2814/ 3125], loss: 0.147, per_step_time: 1412ms, lr: 2.8835236e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66194 samples/s/p 0:07:19 } +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2816/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 2.8466582e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66196 samples/s/p 0:07:16 } +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2818/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 2.8099416e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.65992 samples/s/p 0:07:13 } +2024-07-30 06:03:49,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2820/ 3125], loss: 0.441, per_step_time: 1412ms, lr: 2.773434e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:49,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66188 samples/s/p 0:07:10 } +2024-07-30 06:03:52,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2822/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.7372538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:52,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65964 samples/s/p 0:07:08 } +2024-07-30 06:03:55,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2824/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.7012526e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:55,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65891 samples/s/p 0:07:05 } +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2826/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 2.6655197e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65966 samples/s/p 0:07:02 } +2024-07-30 06:04:01,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2828/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 2.6299952e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65385 samples/s/p 0:07:00 } +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2830/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.5947392e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66038 samples/s/p 0:06:56 } +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2832/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.5597213e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:06,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66023 samples/s/p 0:06:54 } +2024-07-30 06:04:09,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2834/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.5248527e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:09,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66110 samples/s/p 0:06:51 } +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2836/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.4903715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66004 samples/s/p 0:06:48 } +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2838/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.4560093e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:15,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65895 samples/s/p 0:06:45 } +2024-07-30 06:04:18,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2840/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 2.4219453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:18,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65660 samples/s/p 0:06:43 } +2024-07-30 06:04:21,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2842/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 2.3881196e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66109 samples/s/p 0:06:39 } +2024-07-30 06:04:23,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2844/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 2.3544729e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:23,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66103 samples/s/p 0:06:37 } +2024-07-30 06:04:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2846/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3211241e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65918 samples/s/p 0:06:34 } +2024-07-30 06:04:29,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2848/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.2880137e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:29,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65888 samples/s/p 0:06:31 } +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2850/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.255082e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.66017 samples/s/p 0:06:28 } +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2852/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2224187e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65788 samples/s/p 0:06:26 } +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2854/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.1899938e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65585 samples/s/p 0:06:23 } +2024-07-30 06:04:40,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2856/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.1578073e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:40,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65868 samples/s/p 0:06:20 } +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2858/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 2.125889e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:43,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65560 samples/s/p 0:06:17 } +2024-07-30 06:04:46,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2860/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 2.0941794e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:46,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65726 samples/s/p 0:06:14 } +2024-07-30 06:04:49,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2862/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 2.0627379e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:49,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65926 samples/s/p 0:06:11 } +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2864/ 3125], loss: 0.192, per_step_time: 1419ms, lr: 2.0314753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:52,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.63403 samples/s/p 0:06:10 } +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2866/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.0005107e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65848 samples/s/p 0:06:06 } +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2868/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.9697248e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65760 samples/s/p 0:06:03 } +2024-07-30 06:05:00,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2870/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 1.9392072e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:00,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66020 samples/s/p 0:06:00 } +2024-07-30 06:05:03,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2872/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 1.908958e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:03,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65945 samples/s/p 0:05:57 } +2024-07-30 06:05:06,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2874/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.8788874e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:06,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66093 samples/s/p 0:05:54 } +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2876/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 1.849085e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66002 samples/s/p 0:05:51 } +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2878/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 1.819521e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.65730 samples/s/p 0:05:49 } +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2880/ 3125], loss: 0.092, per_step_time: 1413ms, lr: 1.7902254e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66164 samples/s/p 0:05:46 } +2024-07-30 06:05:17,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2882/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 1.7611086e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:17,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66034 samples/s/p 0:05:43 } +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2884/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.73226e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:20,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66053 samples/s/p 0:05:40 } +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2886/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.7036497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65966 samples/s/p 0:05:37 } +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2888/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.6752184e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65759 samples/s/p 0:05:35 } +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2890/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.6471148e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66096 samples/s/p 0:05:32 } +2024-07-30 06:05:31,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2892/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 1.6192198e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:31,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65660 samples/s/p 0:05:29 } +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2894/ 3125], loss: 0.324, per_step_time: 1412ms, lr: 1.5915631e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66184 samples/s/p 0:05:26 } +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2896/ 3125], loss: 0.167, per_step_time: 1415ms, lr: 1.5641152e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:37,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65284 samples/s/p 0:05:24 } +2024-07-30 06:05:40,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2898/ 3125], loss: 0.374, per_step_time: 1412ms, lr: 1.5369654e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:40,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66190 samples/s/p 0:05:20 } +2024-07-30 06:05:43,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2900/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 1.5099644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:43,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66036 samples/s/p 0:05:18 } +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2902/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4832615e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66061 samples/s/p 0:05:15 } +2024-07-30 06:05:48,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2904/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 1.4568269e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:48,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65863 samples/s/p 0:05:12 } +2024-07-30 06:05:51,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2906/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.4305412e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:51,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65773 samples/s/p 0:05:09 } +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2908/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.4045536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65664 samples/s/p 0:05:06 } +2024-07-30 06:05:57,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2910/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 1.3787746e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:57,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65866 samples/s/p 0:05:03 } +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2912/ 3125], loss: 0.152, per_step_time: 1424ms, lr: 1.35329365e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.61439 samples/s/p 0:05:03 } +2024-07-30 06:06:03,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2914/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.3279915e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:03,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.66136 samples/s/p 0:04:58 } +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2916/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.3029575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.66005 samples/s/p 0:04:55 } +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2918/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 1.2781322e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65177 samples/s/p 0:04:53 } +2024-07-30 06:06:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2920/ 3125], loss: 0.135, per_step_time: 1420ms, lr: 1.253575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:11,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.63326 samples/s/p 0:04:51 } +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2922/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 1.2292862e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65858 samples/s/p 0:04:46 } +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2924/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.20517605e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65925 samples/s/p 0:04:44 } +2024-07-30 06:06:20,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2926/ 3125], loss: 0.231, per_step_time: 1415ms, lr: 1.1813044e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:20,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65268 samples/s/p 0:04:41 } +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2928/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.1576712e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:23,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65762 samples/s/p 0:04:38 } +2024-07-30 06:06:25,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2930/ 3125], loss: 0.466, per_step_time: 1412ms, lr: 1.1342763e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:25,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66187 samples/s/p 0:04:35 } +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2932/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.1111796e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65932 samples/s/p 0:04:32 } +2024-07-30 06:06:31,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2934/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.0882616e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:31,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65652 samples/s/p 0:04:30 } +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2936/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.0656118e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:34,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65828 samples/s/p 0:04:27 } +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2938/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.0431707e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.66126 samples/s/p 0:04:24 } +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2940/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 1.0209978e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.66162 samples/s/p 0:04:21 } +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2942/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 9.990334e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:42,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65599 samples/s/p 0:04:18 } +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2944/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 9.773076e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:45,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65983 samples/s/p 0:04:15 } +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2946/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.558499e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65866 samples/s/p 0:04:13 } +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2948/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.346604e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65498 samples/s/p 0:04:10 } +2024-07-30 06:06:54,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2950/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 9.136498e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:54,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.66319 samples/s/p 0:04:07 } +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2952/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 8.9284775e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65949 samples/s/p 0:04:04 } +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2954/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 8.723438e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65731 samples/s/p 0:04:01 } +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2956/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.520781e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:02,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65918 samples/s/p 0:03:58 } +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2958/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 8.320212e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:05,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65563 samples/s/p 0:03:56 } +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2960/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 8.122623e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65442 samples/s/p 0:03:53 } +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2962/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.926523e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66144 samples/s/p 0:03:50 } +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2964/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 7.733404e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66146 samples/s/p 0:03:47 } +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2966/ 3125], loss: 0.223, per_step_time: 1412ms, lr: 7.542371e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66246 samples/s/p 0:03:44 } +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2968/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 7.354021e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65908 samples/s/p 0:03:41 } +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2970/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 7.167458e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65734 samples/s/p 0:03:39 } +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2972/ 3125], loss: 0.431, per_step_time: 1414ms, lr: 6.983876e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65713 samples/s/p 0:03:36 } +2024-07-30 06:07:28,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2974/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.802976e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:28,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65923 samples/s/p 0:03:33 } +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2976/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 6.623864e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:31,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65960 samples/s/p 0:03:30 } +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2978/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 6.447136e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.66016 samples/s/p 0:03:27 } +2024-07-30 06:07:36,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2980/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.2727925e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:36,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65940 samples/s/p 0:03:24 } +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2982/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 6.101131e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:39,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66074 samples/s/p 0:03:22 } +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2984/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 5.931854e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66031 samples/s/p 0:03:19 } +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2986/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.764663e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65965 samples/s/p 0:03:16 } +2024-07-30 06:07:48,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2988/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 5.600452e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:48,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65924 samples/s/p 0:03:13 } +2024-07-30 06:07:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2990/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4374336e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.66118 samples/s/p 0:03:10 } +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2992/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 5.277693e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65885 samples/s/p 0:03:08 } +2024-07-30 06:07:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2994/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 5.120039e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65800 samples/s/p 0:03:05 } +2024-07-30 06:07:59,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2996/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.965365e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:59,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65911 samples/s/p 0:03:02 } +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2998/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 4.812181e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.66011 samples/s/p 0:02:59 } +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3000/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 4.6625734e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65806 samples/s/p 0:02:56 } +2024-07-30 06:08:07,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3002/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 4.5138595e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:07,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65840 samples/s/p 0:02:53 } +2024-07-30 06:08:10,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3004/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 4.3684243e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:10,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65404 samples/s/p 0:02:51 } +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3006/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 4.225373e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65873 samples/s/p 0:02:48 } +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3008/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 4.0844084e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:16,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65718 samples/s/p 0:02:45 } +2024-07-30 06:08:19,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3010/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 3.946125e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:19,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66133 samples/s/p 0:02:42 } +2024-07-30 06:08:22,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3012/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.809929e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:22,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66110 samples/s/p 0:02:39 } +2024-07-30 06:08:24,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3014/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.6761163e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:24,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66012 samples/s/p 0:02:36 } +2024-07-30 06:08:27,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3016/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.544986e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:27,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66139 samples/s/p 0:02:34 } +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3018/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4165382e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:30,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66002 samples/s/p 0:02:31 } +2024-07-30 06:08:33,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3020/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2895802e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66148 samples/s/p 0:02:28 } +2024-07-30 06:08:36,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3022/ 3125], loss: 0.099, per_step_time: 1415ms, lr: 3.1656027e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:36,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65331 samples/s/p 0:02:25 } +2024-07-30 06:08:39,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3024/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 3.043711e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65938 samples/s/p 0:02:22 } +2024-07-30 06:08:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3026/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 2.9245018e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:41,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66195 samples/s/p 0:02:19 } +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3028/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 2.8073788e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:44,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65373 samples/s/p 0:02:17 } +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3030/ 3125], loss: 0.028, per_step_time: 1413ms, lr: 2.6926397e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65976 samples/s/p 0:02:14 } +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3032/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 2.580881e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:50,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.66037 samples/s/p 0:02:11 } +2024-07-30 06:08:53,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3034/ 3125], loss: 0.190, per_step_time: 1416ms, lr: 2.4709106e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:53,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.64723 samples/s/p 0:02:08 } +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3036/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 2.3639202e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:56,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65921 samples/s/p 0:02:05 } +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3038/ 3125], loss: 0.532, per_step_time: 1414ms, lr: 2.2587179e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65410 samples/s/p 0:02:03 } +2024-07-30 06:09:01,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3040/ 3125], loss: 0.358, per_step_time: 1412ms, lr: 2.155602e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:01,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.66330 samples/s/p 0:02:00 } +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3042/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 2.0557642e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65848 samples/s/p 0:01:57 } +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3044/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.9577144e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65711 samples/s/p 0:01:54 } +2024-07-30 06:09:10,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3046/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.8620491e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:10,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65902 samples/s/p 0:01:51 } +2024-07-30 06:09:13,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3048/ 3125], loss: 0.417, per_step_time: 1417ms, lr: 1.7693639e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:13,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.64472 samples/s/p 0:01:49 } +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3050/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6784667e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65945 samples/s/p 0:01:46 } +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3052/ 3125], loss: 0.300, per_step_time: 1415ms, lr: 1.5902519e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:18,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65254 samples/s/p 0:01:43 } +2024-07-30 06:09:21,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3054/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 1.5044211e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:21,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65778 samples/s/p 0:01:40 } +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3056/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 1.4206767e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66261 samples/s/p 0:01:37 } +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3058/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.3396143e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:27,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65871 samples/s/p 0:01:34 } +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3060/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 1.2612342e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66219 samples/s/p 0:01:31 } +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3062/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 1.1846423e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:32,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65473 samples/s/p 0:01:29 } +2024-07-30 06:09:35,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3064/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 1.1107325e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:35,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66126 samples/s/p 0:01:26 } +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3066/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 1.038909e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:38,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66186 samples/s/p 0:01:23 } +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3068/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.694695e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65778 samples/s/p 0:01:20 } +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3070/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.0271235e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:44,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66115 samples/s/p 0:01:17 } +2024-07-30 06:09:47,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3072/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.380413e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:47,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65910 samples/s/p 0:01:14 } +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3074/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 7.7605244e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66056 samples/s/p 0:01:12 } +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3076/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 7.161498e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66181 samples/s/p 0:01:09 } +2024-07-30 06:09:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3078/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 6.595254e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65810 samples/s/p 0:01:06 } +2024-07-30 06:09:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3080/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 6.043911e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65562 samples/s/p 0:01:03 } +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3082/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.5164096e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65836 samples/s/p 0:01:00 } +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3084/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 5.0157306e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65350 samples/s/p 0:00:58 } +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3086/ 3125], loss: 0.515, per_step_time: 1419ms, lr: 4.5418738e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.63631 samples/s/p 0:00:55 } +2024-07-30 06:10:09,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3088/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 4.0858983e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65053 samples/s/p 0:00:52 } +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3090/ 3125], loss: 0.113, per_step_time: 1414ms, lr: 3.6537645e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65673 samples/s/p 0:00:49 } +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3092/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 3.2514333e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65411 samples/s/p 0:00:46 } +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3094/ 3125], loss: 0.468, per_step_time: 1413ms, lr: 2.8669833e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66110 samples/s/p 0:00:43 } +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3096/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 2.5063754e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66170 samples/s/p 0:00:40 } +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3098/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.1785497e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65999 samples/s/p 0:00:38 } +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3100/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.8656253e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65919 samples/s/p 0:00:35 } +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3102/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.5825033e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66059 samples/s/p 0:00:32 } +2024-07-30 06:10:32,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3104/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.3172625e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66082 samples/s/p 0:00:29 } +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3106/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 1.0818243e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:35,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66216 samples/s/p 0:00:26 } +2024-07-30 06:10:38,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3108/ 3125], loss: 0.070, per_step_time: 1413ms, lr: 8.612871e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66150 samples/s/p 0:00:24 } +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3110/ 3125], loss: 0.126, per_step_time: 1425ms, lr: 6.705522e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.61160 samples/s/p 0:00:21 } +2024-07-30 06:10:43,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3112/ 3125], loss: 0.257, per_step_time: 1414ms, lr: 5.0663945e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:43,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65690 samples/s/p 0:00:18 } +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3114/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 3.606081e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:46,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65860 samples/s/p 0:00:15 } +2024-07-30 06:10:49,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3116/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 2.3841857e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:49,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65353 samples/s/p 0:00:12 } +2024-07-30 06:10:52,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3118/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.4603138e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:52,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65894 samples/s/p 0:00:09 } +2024-07-30 06:10:55,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3120/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.45058e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:55,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65818 samples/s/p 0:00:07 } +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3122/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 2.682209e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65672 samples/s/p 0:00:04 } +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3124/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 2.9802322e-13, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:11:00,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65813 samples/s/p 0:00:01 } +2024-07-30 06:11:00,848 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 06:11:30,761 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_1.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_1.log" new file mode 100644 index 00000000..22ad15e5 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_1.log" @@ -0,0 +1,10017 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:07:40.833.465 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:07:41.833.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:07:44.834.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:07:47.834.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:07:47.834.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 1 rank id: 1 +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:08:12.545.122 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:08:12.545.640 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(978972,ffff965ee010,python):2024-07-30-02:08:14.464.592 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-30 02:08:14,467 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_1.ckpt' +2024-07-30 02:08:14,501 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-30 02:08:14,502 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-30 02:08:14,502 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-30 02:08:14,502 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-30 02:08:14,503 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/research/output' +2024-07-30 02:08:14,504 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-30 02:08:14,504 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. +2024-07-30 02:08:14,504 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-30 02:08:14,505 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-30 02:08:14,505 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,505 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-30 02:08:14,505 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-30 02:08:14,505 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-30 02:08:14,506 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,506 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-30 02:08:14,506 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-30 02:08:14,506 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-30 02:08:14,506 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-30 02:08:14,514 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:3125 +2024-07-30 02:08:14,514 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:3, sink_size:2 +2024-07-30 02:08:14,514 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:3125 +2024-07-30 02:08:14,515 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-30 02:08:14,515 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-30 02:08:14,516 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-30 02:08:14,516 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. +2024-07-30 02:08:14,516 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:08:14.518.632 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:08:14.521.356 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-30 02:08:14,633 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:08:14.634.447 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:08:14.634.577 [mindspore/common/parameter.py:806] This interface may be deleted in the future. +2024-07-30 02:08:14,654 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,675 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,695 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,716 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,737 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,758 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,779 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,800 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,822 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:15,296 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,494 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,517 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-30 02:08:15,517 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... +2024-07-30 02:08:15,517 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-30 02:08:15,517 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-30 02:08:15,523 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-30 02:08:15,527 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + "model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + "model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + "model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-30 02:08:15,627 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... +2024-07-30 02:08:15,627 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-30 02:08:15,633 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-30 02:08:15,635 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-30 02:08:15,636 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-30 02:08:15,636 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:11.672.232 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.688.114 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.688.856 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.689.342 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.831.780 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.870.165 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:16.909.305 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:17.523.79 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:17.624.655 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.192.900 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.754.163 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.755.028 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.755.464 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.894.765 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.930.594 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:18.966.287 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:19.104.608 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:19.679.604 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.244.644 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.810.690 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.811.479 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.811.916 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.956.562 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:20.994.601 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:21.317.05 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:21.179.034 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:21.776.675 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:22.338.887 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:22.908.638 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:22.909.576 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:22.910.037 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:23.759.07 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:23.123.883 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:23.166.503 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:23.325.737 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:23.884.098 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:24.453.123 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.143.88 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.152.74 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.157.28 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.190.901 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.267.990 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.306.188 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:25.480.379 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:26.461.85 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:26.616.773 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.192.945 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.193.754 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.194.222 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.352.039 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.388.913 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.427.433 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:27.601.804 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:28.169.653 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:28.739.854 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.311.781 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.312.635 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.313.101 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.487.208 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.532.151 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.570.605 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:29.765.152 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:30.368.292 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:30.997.168 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.601.404 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.602.367 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.602.807 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.766.124 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.807.447 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:31.864.309 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:32.316.29 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:32.620.842 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:33.229.256 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:33.800.019 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:33.800.954 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:33.801.515 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:33.966.836 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:34.191.10 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:34.683.83 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:34.240.037 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:34.796.689 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:35.388.503 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:35.979.289 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:35.980.181 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:35.980.742 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:36.158.186 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:36.208.036 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:36.267.517 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:36.519.277 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:37.102.008 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:37.744.175 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.344.167 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.345.056 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.345.750 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.551.584 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.606.891 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.689.840 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:38.863.909 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:39.425.137 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.733.48 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.647.482 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.648.625 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.649.215 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.820.089 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.897.128 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:40.976.496 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:41.158.648 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:41.732.859 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:42.287.144 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:42.880.334 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:42.881.203 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:42.881.702 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:43.970.32 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:43.148.728 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:43.201.457 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:43.392.902 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:44.251.81 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:44.621.688 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.224.077 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.225.198 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.225.747 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.396.149 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.463.909 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.525.039 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:45.694.248 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:46.259.545 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:46.827.648 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.386.830 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.387.665 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.388.133 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.558.485 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.614.481 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.671.431 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:47.843.500 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:48.399.883 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:48.952.421 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:49.802.922 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:49.803.762 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:49.804.220 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:49.971.489 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:50.212.32 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:50.685.17 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:50.241.834 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:50.856.516 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:51.449.522 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.694.76 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.702.90 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.707.35 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.241.193 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.291.146 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.340.770 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:52.532.875 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:53.130.223 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:53.711.744 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.270.028 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.270.952 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.271.529 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.448.193 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.524.596 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.572.851 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:54.739.662 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:55.310.002 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:55.877.787 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.489.397 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.490.234 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.490.705 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.655.035 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.717.786 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.791.524 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:56.979.422 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:57.564.292 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.136.977 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.725.140 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.725.983 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.726.468 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.901.828 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:58.948.454 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:59.112.68 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:59.187.603 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:10:59.750.086 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:00.309.242 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:00.871.388 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:00.872.226 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:00.872.722 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:01.438.62 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:01.920.46 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:01.139.207 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:01.321.532 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:01.955.792 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:02.527.515 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.875.21 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.883.38 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.888.39 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.258.230 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.305.099 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.352.629 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:03.514.705 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:04.723.26 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:04.658.818 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.256.490 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.257.353 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.257.789 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.434.114 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.482.784 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.582.869 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:05.794.419 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:06.426.099 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:06.988.391 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.594.990 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.595.783 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.596.226 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.772.459 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.820.293 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:07.866.190 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:08.356.11 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:08.590.514 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.141.587 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.707.555 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.708.442 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.708.920 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.877.327 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.940.670 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:09.989.331 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:10.160.487 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:10.733.057 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:11.293.116 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:11.857.980 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:11.859.031 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:11.859.625 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:12.183.424 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:12.230.289 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:12.275.716 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:12.449.565 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:13.198.2 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:13.616.671 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.241.933 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.242.667 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.243.122 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.506.002 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.556.072 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.602.838 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:14.774.571 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:15.342.402 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:15.897.817 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.595.975 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.596.900 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.597.341 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.817.999 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.886.906 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:16.933.904 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:17.104.455 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:17.681.515 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:18.301.924 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:18.862.052 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:18.862.943 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:18.863.389 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:19.309.55 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:19.821.73 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:19.126.509 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:19.297.024 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:19.856.755 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:20.410.665 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:20.989.796 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:20.990.638 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:20.991.091 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:21.163.057 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:21.212.664 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:21.259.342 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:21.431.569 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:21.993.586 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:22.568.109 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.130.867 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.131.669 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.132.128 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.317.461 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.393.007 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.476.340 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:23.645.977 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:24.199.812 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:24.758.847 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.320.549 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.321.359 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.321.794 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.492.011 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.538.203 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.583.711 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:25.755.061 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:26.364.786 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:26.970.488 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:27.633.303 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:27.634.151 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:57.757.810 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:11:57.762.114 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:06.584.447 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:06.588.414 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:15.432.123 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:15.436.097 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:24.248.843 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:24.252.798 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:33.953.82 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:33.994.37 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:41.943.382 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:41.947.309 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:50.773.231 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:50.777.854 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:59.573.642 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:12:59.577.505 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:08.329.097 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:08.333.195 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:17.203.865 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:17.207.767 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:26.737.39 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:26.778.88 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:35.266.41 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:35.305.95 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:43.945.286 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:43.949.303 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:52.874.696 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:13:52.878.745 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:01.784.197 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:01.788.370 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:10.889.082 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:10.892.990 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:19.723.336 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:19.727.511 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:28.558.768 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:28.562.744 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:37.402.696 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:37.406.863 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:46.247.498 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:46.251.532 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:55.539.074 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:14:55.543.139 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:05.982.69 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:05.102.257 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:14.289.949 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:14.294.073 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:23.175.348 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:23.179.339 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:32.403.68 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:32.445.56 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:40.837.307 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:40.841.287 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:49.585.808 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:49.589.904 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:58.812.777 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:15:58.816.665 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:07.670.228 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:07.674.293 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:16.539.427 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:16.543.387 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:25.345.776 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:25.349.901 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:34.407.067 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:34.411.022 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:16:43.329.326 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:17:05.405.710 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:17:05.406.157 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-30 02:17:05,406 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-30 02:17:05,407 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO - .........Starting Training Model.......... +2024-07-30 02:17:05,407 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:17:05.408.619 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_end', 'epoch_begin', 'step_begin', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(978972:281473204543504,MainProcess):2024-07-30-02:17:05.408.767 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'epoch_end', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.823.166 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.823.928 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.824.615 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.825.293 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.825.960 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.826.627 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.827.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.827.979 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.828.669 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.829.336 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.830.001 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.830.659 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.831.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.831.959 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.832.644 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.833.301 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.833.952 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.834.592 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.835.228 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.835.876 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.836.519 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.837.176 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.837.840 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.838.496 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.839.148 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.839.794 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.840.444 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.841.113 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.841.768 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.842.409 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.843.072 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.843.716 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.844.164 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.844.906 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.845.639 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.846.364 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.847.081 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.847.817 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.848.597 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.849.343 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.850.088 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.850.835 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.851.572 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.852.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.853.064 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.853.793 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.854.533 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.855.251 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.855.961 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.856.708 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.857.414 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.858.116 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.858.821 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.859.518 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.860.218 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.860.929 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.861.625 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.862.310 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.863.006 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.863.697 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.864.386 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.865.080 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.865.732 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:33.866.344 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978972,ffff965ee010,python):2024-07-30-02:17:36.496.246 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. +- \ | 2024-07-30 02:26:19,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2/ 3125], loss: 1.392, per_step_time: 275957ms, lr: 3.558719e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:19,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02899 samples/s/p 29 days, 22:29:08 } +2024-07-30 02:26:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 4/ 3125], loss: 1.327, per_step_time: 1419ms, lr: 1.0676156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.63518 samples/s/p 3:41:43 } +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 6/ 3125], loss: 1.193, per_step_time: 1413ms, lr: 1.7793593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.66153 samples/s/p 3:40:38 } +2024-07-30 02:26:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 8/ 3125], loss: 1.399, per_step_time: 1415ms, lr: 2.4911031e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:28,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65030 samples/s/p 3:41:02 } +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 10/ 3125], loss: 1.360, per_step_time: 1414ms, lr: 3.202847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65512 samples/s/p 3:40:48 } +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 12/ 3125], loss: 1.379, per_step_time: 1413ms, lr: 3.9145905e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65892 samples/s/p 3:40:36 } +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 14/ 3125], loss: 1.350, per_step_time: 1413ms, lr: 4.6263344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65858 samples/s/p 3:40:34 } +2024-07-30 02:26:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 16/ 3125], loss: 1.343, per_step_time: 1413ms, lr: 5.3380785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:40,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65966 samples/s/p 3:40:29 } +2024-07-30 02:26:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 18/ 3125], loss: 1.049, per_step_time: 1413ms, lr: 6.049822e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:43,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65852 samples/s/p 3:40:28 } +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 20/ 3125], loss: 1.286, per_step_time: 1413ms, lr: 6.7615656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65828 samples/s/p 3:40:26 } +2024-07-30 02:26:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 22/ 3125], loss: 1.170, per_step_time: 1413ms, lr: 7.473309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65979 samples/s/p 3:40:20 } +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 24/ 3125], loss: 1.197, per_step_time: 1413ms, lr: 8.185053e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66011 samples/s/p 3:40:16 } +2024-07-30 02:26:54,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 26/ 3125], loss: 1.367, per_step_time: 1413ms, lr: 8.896797e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:54,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65834 samples/s/p 3:40:18 } +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 28/ 3125], loss: 1.430, per_step_time: 1414ms, lr: 9.608541e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65756 samples/s/p 3:40:17 } +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 30/ 3125], loss: 1.447, per_step_time: 1412ms, lr: 1.0320284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66223 samples/s/p 3:40:03 } +2024-07-30 02:27:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 32/ 3125], loss: 1.653, per_step_time: 1415ms, lr: 1.1032029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:02,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65249 samples/s/p 3:40:23 } +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 34/ 3125], loss: 1.188, per_step_time: 1424ms, lr: 1.1743772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.61491 samples/s/p 3:41:48 } +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 36/ 3125], loss: 1.306, per_step_time: 1414ms, lr: 1.2455515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65610 samples/s/p 3:40:09 } +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 38/ 3125], loss: 1.332, per_step_time: 1413ms, lr: 1.3167258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.66052 samples/s/p 3:39:55 } +2024-07-30 02:27:14,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 40/ 3125], loss: 1.375, per_step_time: 1416ms, lr: 1.3879004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.64910 samples/s/p 3:40:19 } +2024-07-30 02:27:17,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 42/ 3125], loss: 1.420, per_step_time: 1413ms, lr: 1.4590747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:17,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65926 samples/s/p 3:39:53 } +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 44/ 3125], loss: 1.437, per_step_time: 1413ms, lr: 1.530249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:19,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66138 samples/s/p 3:39:45 } +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 46/ 3125], loss: 1.287, per_step_time: 1412ms, lr: 1.6014234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66212 samples/s/p 3:39:40 } +2024-07-30 02:27:25,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 48/ 3125], loss: 1.380, per_step_time: 1414ms, lr: 1.6725978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:25,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65478 samples/s/p 3:39:55 } +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 50/ 3125], loss: 1.100, per_step_time: 1413ms, lr: 1.7437721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65849 samples/s/p 3:39:43 } +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 52/ 3125], loss: 1.361, per_step_time: 1413ms, lr: 1.8149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:31,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65843 samples/s/p 3:39:41 } +2024-07-30 02:27:34,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 54/ 3125], loss: 1.508, per_step_time: 1413ms, lr: 1.886121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:34,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65874 samples/s/p 3:39:37 } +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 56/ 3125], loss: 1.341, per_step_time: 1412ms, lr: 1.9572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66241 samples/s/p 3:39:26 } +2024-07-30 02:27:39,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 58/ 3125], loss: 1.275, per_step_time: 1413ms, lr: 2.0284697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:39,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66084 samples/s/p 3:39:26 } +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 60/ 3125], loss: 1.126, per_step_time: 1412ms, lr: 2.099644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66196 samples/s/p 3:39:21 } +2024-07-30 02:27:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 62/ 3125], loss: 1.619, per_step_time: 1413ms, lr: 2.1708183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65868 samples/s/p 3:39:26 } +2024-07-30 02:27:48,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 64/ 3125], loss: 1.251, per_step_time: 1415ms, lr: 2.2419927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:48,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65067 samples/s/p 3:39:42 } +2024-07-30 02:27:51,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 66/ 3125], loss: 1.324, per_step_time: 1413ms, lr: 2.3131672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:51,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.66050 samples/s/p 3:39:16 } +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 68/ 3125], loss: 1.160, per_step_time: 1413ms, lr: 2.3843415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65915 samples/s/p 3:39:16 } +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 70/ 3125], loss: 1.056, per_step_time: 1413ms, lr: 2.4555159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65839 samples/s/p 3:39:15 } +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 72/ 3125], loss: 1.486, per_step_time: 1415ms, lr: 2.5266902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65280 samples/s/p 3:39:25 } +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 74/ 3125], loss: 1.359, per_step_time: 1414ms, lr: 2.5978647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65670 samples/s/p 3:39:13 } +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 76/ 3125], loss: 1.356, per_step_time: 1415ms, lr: 2.669039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65177 samples/s/p 3:39:22 } +2024-07-30 02:28:08,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 78/ 3125], loss: 1.349, per_step_time: 1414ms, lr: 2.7402134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:08,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65675 samples/s/p 3:39:08 } +2024-07-30 02:28:10,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 80/ 3125], loss: 1.630, per_step_time: 1413ms, lr: 2.8113877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:10,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66127 samples/s/p 3:38:54 } +2024-07-30 02:28:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 82/ 3125], loss: 1.549, per_step_time: 1414ms, lr: 2.8825623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65744 samples/s/p 3:39:00 } +2024-07-30 02:28:16,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 84/ 3125], loss: 1.097, per_step_time: 1413ms, lr: 2.9537364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:16,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65868 samples/s/p 3:38:55 } +2024-07-30 02:28:19,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 86/ 3125], loss: 1.357, per_step_time: 1413ms, lr: 3.024911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66133 samples/s/p 3:38:46 } +2024-07-30 02:28:22,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 88/ 3125], loss: 1.011, per_step_time: 1416ms, lr: 3.0960855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:22,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.64613 samples/s/p 3:39:18 } +2024-07-30 02:28:25,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 90/ 3125], loss: 0.990, per_step_time: 1413ms, lr: 3.1672596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:25,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.66095 samples/s/p 3:38:41 } +2024-07-30 02:28:27,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 92/ 3125], loss: 1.119, per_step_time: 1414ms, lr: 3.2384341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:27,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65594 samples/s/p 3:38:50 } +2024-07-30 02:28:30,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 94/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.3096082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:30,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65821 samples/s/p 3:38:42 } +2024-07-30 02:28:33,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 96/ 3125], loss: 1.270, per_step_time: 1414ms, lr: 3.3807828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:33,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65628 samples/s/p 3:38:43 } +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 98/ 3125], loss: 1.162, per_step_time: 1413ms, lr: 3.4519574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.66032 samples/s/p 3:38:31 } +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 100/ 3125], loss: 0.916, per_step_time: 1412ms, lr: 3.5231315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66211 samples/s/p 3:38:24 } +2024-07-30 02:28:42,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 102/ 3125], loss: 1.030, per_step_time: 1414ms, lr: 3.594306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:42,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65590 samples/s/p 3:38:36 } +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 104/ 3125], loss: 1.432, per_step_time: 1415ms, lr: 3.6654803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65283 samples/s/p 3:38:40 } +2024-07-30 02:28:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 106/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.7366547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66024 samples/s/p 3:38:20 } +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 108/ 3125], loss: 1.291, per_step_time: 1413ms, lr: 3.807829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65942 samples/s/p 3:38:19 } +2024-07-30 02:28:53,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 110/ 3125], loss: 1.239, per_step_time: 1413ms, lr: 3.8790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:53,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66042 samples/s/p 3:38:14 } +2024-07-30 02:28:56,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 112/ 3125], loss: 1.071, per_step_time: 1415ms, lr: 3.950178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65328 samples/s/p 3:38:28 } +2024-07-30 02:28:59,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 114/ 3125], loss: 1.148, per_step_time: 1414ms, lr: 4.021352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:59,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65752 samples/s/p 3:38:15 } +2024-07-30 02:29:02,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 116/ 3125], loss: 1.301, per_step_time: 1413ms, lr: 4.0925265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:02,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66131 samples/s/p 3:38:03 } +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 118/ 3125], loss: 0.982, per_step_time: 1413ms, lr: 4.163701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65802 samples/s/p 3:38:08 } +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 120/ 3125], loss: 1.209, per_step_time: 1414ms, lr: 4.234875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65630 samples/s/p 3:38:09 } +2024-07-30 02:29:10,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 122/ 3125], loss: 0.910, per_step_time: 1414ms, lr: 4.3060495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:10,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65624 samples/s/p 3:38:07 } +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 124/ 3125], loss: 1.276, per_step_time: 1414ms, lr: 4.377224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65436 samples/s/p 3:38:08 } +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 126/ 3125], loss: 1.127, per_step_time: 1414ms, lr: 4.4483986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65768 samples/s/p 3:37:58 } +2024-07-30 02:29:19,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 128/ 3125], loss: 0.940, per_step_time: 1414ms, lr: 4.519573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:19,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65771 samples/s/p 3:37:55 } +2024-07-30 02:29:21,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 130/ 3125], loss: 1.026, per_step_time: 1413ms, lr: 4.5907473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:21,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65940 samples/s/p 3:37:48 } +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 132/ 3125], loss: 0.990, per_step_time: 1414ms, lr: 4.6619216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65635 samples/s/p 3:37:52 } +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 134/ 3125], loss: 1.413, per_step_time: 1413ms, lr: 4.733096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65977 samples/s/p 3:37:42 } +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 136/ 3125], loss: 1.120, per_step_time: 1414ms, lr: 4.8042702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65731 samples/s/p 3:37:44 } +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 138/ 3125], loss: 0.952, per_step_time: 1415ms, lr: 4.8754446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65344 samples/s/p 3:37:50 } +2024-07-30 02:29:36,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 140/ 3125], loss: 1.111, per_step_time: 1414ms, lr: 4.9466194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:36,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65601 samples/s/p 3:37:42 } +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 142/ 3125], loss: 1.099, per_step_time: 1414ms, lr: 5.0177937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65614 samples/s/p 3:37:39 } +2024-07-30 02:29:41,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 144/ 3125], loss: 1.208, per_step_time: 1413ms, lr: 5.0889676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:41,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65847 samples/s/p 3:37:30 } +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 146/ 3125], loss: 1.044, per_step_time: 1413ms, lr: 5.160142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.65999 samples/s/p 3:37:24 } +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 148/ 3125], loss: 1.002, per_step_time: 1413ms, lr: 5.2313167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66003 samples/s/p 3:37:21 } +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 150/ 3125], loss: 1.366, per_step_time: 1413ms, lr: 5.302491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66138 samples/s/p 3:37:15 } +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 152/ 3125], loss: 0.954, per_step_time: 1413ms, lr: 5.3736658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:53,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66062 samples/s/p 3:37:14 } +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 154/ 3125], loss: 0.976, per_step_time: 1413ms, lr: 5.4448396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66107 samples/s/p 3:37:10 } +2024-07-30 02:29:58,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 156/ 3125], loss: 1.448, per_step_time: 1415ms, lr: 5.516014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:58,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65242 samples/s/p 3:37:27 } +2024-07-30 02:30:01,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 158/ 3125], loss: 1.134, per_step_time: 1413ms, lr: 5.5871883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:01,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65901 samples/s/p 3:37:09 } +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 160/ 3125], loss: 1.046, per_step_time: 1413ms, lr: 5.658363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65880 samples/s/p 3:37:07 } +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 162/ 3125], loss: 1.002, per_step_time: 1414ms, lr: 5.7295374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65665 samples/s/p 3:37:09 } +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 164/ 3125], loss: 0.902, per_step_time: 1412ms, lr: 5.8007113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.66176 samples/s/p 3:36:55 } +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 166/ 3125], loss: 1.278, per_step_time: 1413ms, lr: 5.871886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65930 samples/s/p 3:36:57 } +2024-07-30 02:30:15,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 168/ 3125], loss: 0.935, per_step_time: 1415ms, lr: 5.9430604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:15,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65282 samples/s/p 3:37:09 } +2024-07-30 02:30:18,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 170/ 3125], loss: 0.847, per_step_time: 1413ms, lr: 6.0142347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:18,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65911 samples/s/p 3:36:52 } +2024-07-30 02:30:21,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 172/ 3125], loss: 0.977, per_step_time: 1413ms, lr: 6.0854086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:21,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65951 samples/s/p 3:36:48 } +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 174/ 3125], loss: 1.147, per_step_time: 1413ms, lr: 6.1565834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66032 samples/s/p 3:36:44 } +2024-07-30 02:30:27,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 176/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 6.2277577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:27,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66024 samples/s/p 3:36:41 } +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 178/ 3125], loss: 0.672, per_step_time: 1413ms, lr: 6.2989325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.65881 samples/s/p 3:36:42 } +2024-07-30 02:30:32,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 180/ 3125], loss: 0.873, per_step_time: 1413ms, lr: 6.370107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:32,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66007 samples/s/p 3:36:36 } +2024-07-30 02:30:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 182/ 3125], loss: 1.075, per_step_time: 1416ms, lr: 6.4412807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:35,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.64758 samples/s/p 3:37:02 } +2024-07-30 02:30:38,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 184/ 3125], loss: 0.945, per_step_time: 1414ms, lr: 6.512455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:38,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65729 samples/s/p 3:36:37 } +2024-07-30 02:30:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 186/ 3125], loss: 0.759, per_step_time: 1415ms, lr: 6.58363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65139 samples/s/p 3:36:47 } +2024-07-30 02:30:44,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 188/ 3125], loss: 0.980, per_step_time: 1413ms, lr: 6.654804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:44,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65948 samples/s/p 3:36:26 } +2024-07-30 02:30:46,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 190/ 3125], loss: 1.129, per_step_time: 1413ms, lr: 6.725979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:46,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.66145 samples/s/p 3:36:19 } +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 192/ 3125], loss: 0.925, per_step_time: 1413ms, lr: 6.7971528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:49,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65775 samples/s/p 3:36:24 } +2024-07-30 02:30:52,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 194/ 3125], loss: 0.785, per_step_time: 1413ms, lr: 6.868327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66128 samples/s/p 3:36:13 } +2024-07-30 02:30:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 196/ 3125], loss: 1.030, per_step_time: 1413ms, lr: 6.9395014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:55,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66067 samples/s/p 3:36:12 } +2024-07-30 02:30:58,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 198/ 3125], loss: 0.733, per_step_time: 1413ms, lr: 7.010676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:58,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65970 samples/s/p 3:36:11 } +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 200/ 3125], loss: 0.688, per_step_time: 1414ms, lr: 7.0818505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65407 samples/s/p 3:36:21 } +2024-07-30 02:31:03,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 202/ 3125], loss: 0.663, per_step_time: 1413ms, lr: 7.1530244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:03,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65816 samples/s/p 3:36:09 } +2024-07-30 02:31:06,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 204/ 3125], loss: 0.988, per_step_time: 1414ms, lr: 7.224199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:06,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65388 samples/s/p 3:36:16 } +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 206/ 3125], loss: 1.034, per_step_time: 1413ms, lr: 7.2953735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65827 samples/s/p 3:36:03 } +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 208/ 3125], loss: 0.978, per_step_time: 1414ms, lr: 7.366548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65502 samples/s/p 3:36:08 } +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 210/ 3125], loss: 0.827, per_step_time: 1413ms, lr: 7.4377217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.66083 samples/s/p 3:35:52 } +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 212/ 3125], loss: 0.735, per_step_time: 1413ms, lr: 7.5088965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65865 samples/s/p 3:35:54 } +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 214/ 3125], loss: 0.890, per_step_time: 1414ms, lr: 7.580071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65542 samples/s/p 3:35:58 } +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 216/ 3125], loss: 0.707, per_step_time: 1413ms, lr: 7.651245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.66079 samples/s/p 3:35:43 } +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 218/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 7.7224195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65778 samples/s/p 3:35:47 } +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 220/ 3125], loss: 0.692, per_step_time: 1413ms, lr: 7.793594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65871 samples/s/p 3:35:42 } +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 222/ 3125], loss: 0.531, per_step_time: 1413ms, lr: 7.864768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65938 samples/s/p 3:35:38 } +2024-07-30 02:31:35,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 224/ 3125], loss: 0.898, per_step_time: 1415ms, lr: 7.935942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:35,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65060 samples/s/p 3:35:55 } +2024-07-30 02:31:37,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 226/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 8.007118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66127 samples/s/p 3:35:28 } +2024-07-30 02:31:40,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 228/ 3125], loss: 0.643, per_step_time: 1413ms, lr: 8.078292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:40,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65913 samples/s/p 3:35:30 } +2024-07-30 02:31:43,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 230/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 8.149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:43,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66059 samples/s/p 3:35:24 } +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 232/ 3125], loss: 0.616, per_step_time: 1413ms, lr: 8.220641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65891 samples/s/p 3:35:25 } +2024-07-30 02:31:49,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 234/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 8.291815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66053 samples/s/p 3:35:18 } +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 236/ 3125], loss: 0.715, per_step_time: 1413ms, lr: 8.362989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66089 samples/s/p 3:35:15 } +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 238/ 3125], loss: 0.645, per_step_time: 1413ms, lr: 8.434164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65905 samples/s/p 3:35:16 } +2024-07-30 02:31:57,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 240/ 3125], loss: 0.602, per_step_time: 1413ms, lr: 8.505338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:57,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66129 samples/s/p 3:35:08 } +2024-07-30 02:32:00,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 242/ 3125], loss: 0.831, per_step_time: 1413ms, lr: 8.576512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65871 samples/s/p 3:35:11 } +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 244/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.647687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65845 samples/s/p 3:35:09 } +2024-07-30 02:32:06,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 246/ 3125], loss: 0.654, per_step_time: 1413ms, lr: 8.718861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:06,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65893 samples/s/p 3:35:05 } +2024-07-30 02:32:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 248/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 8.790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:09,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65940 samples/s/p 3:35:01 } +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 250/ 3125], loss: 0.783, per_step_time: 1414ms, lr: 8.86121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65452 samples/s/p 3:35:10 } +2024-07-30 02:32:14,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 252/ 3125], loss: 0.595, per_step_time: 1414ms, lr: 8.932384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:14,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65742 samples/s/p 3:35:00 } +2024-07-30 02:32:17,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 254/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.003558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65772 samples/s/p 3:34:57 } +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 256/ 3125], loss: 0.632, per_step_time: 1413ms, lr: 9.074733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.66163 samples/s/p 3:34:45 } +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 258/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 9.145907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65910 samples/s/p 3:34:48 } +2024-07-30 02:32:26,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 260/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.217081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:26,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65905 samples/s/p 3:34:45 } +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 262/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 9.288256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.66026 samples/s/p 3:34:39 } +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 264/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.359431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:31,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65850 samples/s/p 3:34:41 } +2024-07-30 02:32:34,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 266/ 3125], loss: 0.649, per_step_time: 1413ms, lr: 9.430605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:34,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65917 samples/s/p 3:34:36 } +2024-07-30 02:32:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 268/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.501779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:37,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65575 samples/s/p 3:34:41 } +2024-07-30 02:32:40,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 270/ 3125], loss: 0.578, per_step_time: 1413ms, lr: 9.572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65874 samples/s/p 3:34:32 } +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 272/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.644128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66038 samples/s/p 3:34:25 } +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 274/ 3125], loss: 0.552, per_step_time: 1412ms, lr: 9.715302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66178 samples/s/p 3:34:19 } +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 276/ 3125], loss: 0.565, per_step_time: 1413ms, lr: 9.786476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66106 samples/s/p 3:34:18 } +2024-07-30 02:32:51,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 278/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.857651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:51,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66046 samples/s/p 3:34:16 } +2024-07-30 02:32:54,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 280/ 3125], loss: 0.584, per_step_time: 1413ms, lr: 9.928825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:54,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66107 samples/s/p 3:34:12 } +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 282/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1e-05, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66063 samples/s/p 3:34:10 } +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 284/ 3125], loss: 0.723, per_step_time: 1413ms, lr: 9.999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:00,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66058 samples/s/p 3:34:08 } +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 286/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 9.999995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66144 samples/s/p 3:34:03 } +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 288/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.999989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65804 samples/s/p 3:34:08 } +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 290/ 3125], loss: 0.653, per_step_time: 1413ms, lr: 9.999981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66171 samples/s/p 3:33:57 } +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 292/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.99997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66089 samples/s/p 3:33:56 } +2024-07-30 02:33:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 294/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.999957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:14,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66050 samples/s/p 3:33:54 } +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 296/ 3125], loss: 0.624, per_step_time: 1413ms, lr: 9.9999415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65923 samples/s/p 3:33:54 } +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 298/ 3125], loss: 0.522, per_step_time: 1413ms, lr: 9.999923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:19,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65852 samples/s/p 3:33:53 } +2024-07-30 02:33:22,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 300/ 3125], loss: 0.537, per_step_time: 1414ms, lr: 9.999903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:22,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65538 samples/s/p 3:33:57 } +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 302/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.999881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65804 samples/s/p 3:33:48 } +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 304/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 9.999855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65511 samples/s/p 3:33:52 } +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 306/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.999828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66225 samples/s/p 3:33:33 } +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 308/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.999798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65917 samples/s/p 3:33:37 } +2024-07-30 02:33:36,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 310/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.999765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:36,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66040 samples/s/p 3:33:31 } +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 312/ 3125], loss: 0.609, per_step_time: 1413ms, lr: 9.9997305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:39,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65962 samples/s/p 3:33:30 } +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 314/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 9.999694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65904 samples/s/p 3:33:29 } +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 316/ 3125], loss: 0.526, per_step_time: 1414ms, lr: 9.999654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65770 samples/s/p 3:33:29 } +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 318/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.999613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:48,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66076 samples/s/p 3:33:19 } +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 320/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.999569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65969 samples/s/p 3:33:19 } +2024-07-30 02:33:53,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 322/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.999521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:53,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66042 samples/s/p 3:33:14 } +2024-07-30 02:33:56,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 324/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.999473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:56,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65880 samples/s/p 3:33:15 } +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 326/ 3125], loss: 0.508, per_step_time: 1415ms, lr: 9.999422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65323 samples/s/p 3:33:25 } +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 328/ 3125], loss: 0.454, per_step_time: 1414ms, lr: 9.999369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65727 samples/s/p 3:33:13 } +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 330/ 3125], loss: 0.249, per_step_time: 1426ms, lr: 9.999312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.60934 samples/s/p 3:34:59 } +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 332/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.999253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:08,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65519 samples/s/p 3:33:12 } +2024-07-30 02:34:10,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 334/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.999193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:10,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66080 samples/s/p 3:32:57 } +2024-07-30 02:34:13,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 336/ 3125], loss: 0.487, per_step_time: 1413ms, lr: 9.99913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65904 samples/s/p 3:32:58 } +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 338/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.999064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66005 samples/s/p 3:32:53 } +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 340/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.998996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66024 samples/s/p 3:32:49 } +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 342/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 9.998925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65910 samples/s/p 3:32:49 } +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 344/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.998853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65909 samples/s/p 3:32:46 } +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 346/ 3125], loss: 0.434, per_step_time: 1412ms, lr: 9.998778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66327 samples/s/p 3:32:34 } +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 348/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 9.9987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65933 samples/s/p 3:32:40 } +2024-07-30 02:34:33,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 350/ 3125], loss: 0.393, per_step_time: 1416ms, lr: 9.99862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:33,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.64691 samples/s/p 3:33:05 } +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 352/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.998537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65620 samples/s/p 3:32:41 } +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 354/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.998453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66139 samples/s/p 3:32:27 } +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 356/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 9.998366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65809 samples/s/p 3:32:32 } +2024-07-30 02:34:45,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 358/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.998276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:45,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66118 samples/s/p 3:32:22 } +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 360/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 9.998184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65706 samples/s/p 3:32:28 } +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 362/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.99809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65894 samples/s/p 3:32:21 } +2024-07-30 02:34:53,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 364/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.997993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:53,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66190 samples/s/p 3:32:12 } +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 366/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66070 samples/s/p 3:32:11 } +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 368/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66152 samples/s/p 3:32:07 } +2024-07-30 02:35:02,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 370/ 3125], loss: 0.284, per_step_time: 1425ms, lr: 9.99769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.61168 samples/s/p 3:33:57 } +2024-07-30 02:35:04,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 372/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.997583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:04,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.66039 samples/s/p 3:32:04 } +2024-07-30 02:35:07,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 374/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.997474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:07,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65554 samples/s/p 3:32:12 } +2024-07-30 02:35:10,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 376/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 9.997363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:10,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.66127 samples/s/p 3:31:56 } +2024-07-30 02:35:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 378/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.997249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.65893 samples/s/p 3:31:59 } +2024-07-30 02:35:16,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 380/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.997134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:16,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65734 samples/s/p 3:31:59 } +2024-07-30 02:35:19,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 382/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.997016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:19,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65923 samples/s/p 3:31:52 } +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 384/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.996896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:21,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65769 samples/s/p 3:31:53 } +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 386/ 3125], loss: 0.075, per_step_time: 1414ms, lr: 9.996773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65593 samples/s/p 3:31:54 } +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 388/ 3125], loss: 0.596, per_step_time: 1414ms, lr: 9.996647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65761 samples/s/p 3:31:47 } +2024-07-30 02:35:30,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 390/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.996519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:30,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66170 samples/s/p 3:31:35 } +2024-07-30 02:35:33,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 392/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.996389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:33,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66075 samples/s/p 3:31:35 } +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 394/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.996256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66096 samples/s/p 3:31:31 } +2024-07-30 02:35:38,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 396/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.996122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65836 samples/s/p 3:31:34 } +2024-07-30 02:35:41,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 398/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.995984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:41,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65870 samples/s/p 3:31:31 } +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 400/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.995845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:44,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65538 samples/s/p 3:31:35 } +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 402/ 3125], loss: 0.443, per_step_time: 1413ms, lr: 9.995703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65968 samples/s/p 3:31:23 } +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 404/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.995558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65922 samples/s/p 3:31:21 } +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 406/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.995412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65778 samples/s/p 3:31:22 } +2024-07-30 02:35:55,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 408/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.995262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:55,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65566 samples/s/p 3:31:23 } +2024-07-30 02:35:58,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 410/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 9.995111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:58,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66057 samples/s/p 3:31:10 } +2024-07-30 02:36:01,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 412/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.994957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:01,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65852 samples/s/p 3:31:11 } +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 414/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.994801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:04,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66037 samples/s/p 3:31:04 } +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 416/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 9.994643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:07,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65927 samples/s/p 3:31:04 } +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 418/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.994482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66076 samples/s/p 3:30:58 } +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 420/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 9.994317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:12,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66239 samples/s/p 3:30:51 } +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 422/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.994152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.65793 samples/s/p 3:30:59 } +2024-07-30 02:36:18,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 424/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.993983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:18,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66037 samples/s/p 3:30:50 } +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 426/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.9938125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66266 samples/s/p 3:30:42 } +2024-07-30 02:36:24,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 428/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.99364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:24,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66036 samples/s/p 3:30:45 } +2024-07-30 02:36:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 430/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.993465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:27,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66141 samples/s/p 3:30:39 } +2024-07-30 02:36:29,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 432/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 9.993287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:29,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65669 samples/s/p 3:30:47 } +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 434/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 9.993107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66005 samples/s/p 3:30:37 } +2024-07-30 02:36:35,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 436/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 9.992924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:35,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65641 samples/s/p 3:30:42 } +2024-07-30 02:36:38,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 438/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 9.992738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65786 samples/s/p 3:30:36 } +2024-07-30 02:36:41,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 440/ 3125], loss: 0.661, per_step_time: 1414ms, lr: 9.992552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:41,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65769 samples/s/p 3:30:34 } +2024-07-30 02:36:44,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 442/ 3125], loss: 0.255, per_step_time: 1415ms, lr: 9.992362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:44,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65345 samples/s/p 3:30:40 } +2024-07-30 02:36:46,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 444/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.99217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:46,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65727 samples/s/p 3:30:29 } +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 446/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.991976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66038 samples/s/p 3:30:19 } +2024-07-30 02:36:52,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 448/ 3125], loss: 0.331, per_step_time: 1415ms, lr: 9.991779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:52,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65261 samples/s/p 3:30:34 } +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 450/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.99158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66267 samples/s/p 3:30:08 } +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 452/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.991378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65878 samples/s/p 3:30:14 } +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 454/ 3125], loss: 0.512, per_step_time: 1414ms, lr: 9.991173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65756 samples/s/p 3:30:14 } +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 456/ 3125], loss: 0.390, per_step_time: 1414ms, lr: 9.990968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65514 samples/s/p 3:30:17 } +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 458/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.990758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65758 samples/s/p 3:30:08 } +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 460/ 3125], loss: 0.634, per_step_time: 1412ms, lr: 9.990547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66203 samples/s/p 3:29:56 } +2024-07-30 02:37:12,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 462/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.990334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66164 samples/s/p 3:29:54 } +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 464/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 9.990118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65494 samples/s/p 3:30:06 } +2024-07-30 02:37:18,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 466/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 9.9899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:18,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66139 samples/s/p 3:29:49 } +2024-07-30 02:37:20,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 468/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 9.98968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:20,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66120 samples/s/p 3:29:46 } +2024-07-30 02:37:23,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 470/ 3125], loss: 0.148, per_step_time: 1412ms, lr: 9.989456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:23,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66176 samples/s/p 3:29:42 } +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 472/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.98923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.65806 samples/s/p 3:29:48 } +2024-07-30 02:37:29,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 474/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.989003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:29,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.66042 samples/s/p 3:29:39 } +2024-07-30 02:37:32,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 476/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 9.988773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:32,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65941 samples/s/p 3:29:39 } +2024-07-30 02:37:35,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 478/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.98854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:35,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65944 samples/s/p 3:29:36 } +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 480/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.9883055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65849 samples/s/p 3:29:35 } +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 482/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 9.988068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65624 samples/s/p 3:29:37 } +2024-07-30 02:37:43,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 484/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 9.987828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:43,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65981 samples/s/p 3:29:27 } +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 486/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.987586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65870 samples/s/p 3:29:26 } +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 488/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.987341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:49,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65894 samples/s/p 3:29:23 } +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 490/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 9.987094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.66049 samples/s/p 3:29:17 } +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 492/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 9.986845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65741 samples/s/p 3:29:21 } +2024-07-30 02:37:57,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 494/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.986594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:57,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65829 samples/s/p 3:29:16 } +2024-07-30 02:38:00,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 496/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 9.986339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:00,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65659 samples/s/p 3:29:17 } +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 498/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.986084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65843 samples/s/p 3:29:10 } +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 500/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 9.985824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65686 samples/s/p 3:29:11 } +2024-07-30 02:38:09,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 502/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 9.985563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:09,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66026 samples/s/p 3:29:00 } +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 504/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 9.9853005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66321 samples/s/p 3:28:51 } +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 506/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 9.985034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65689 samples/s/p 3:29:02 } +2024-07-30 02:38:17,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 508/ 3125], loss: 0.528, per_step_time: 1413ms, lr: 9.984766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:17,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66056 samples/s/p 3:28:51 } +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 510/ 3125], loss: 0.415, per_step_time: 1414ms, lr: 9.984494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:20,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65761 samples/s/p 3:28:55 } +2024-07-30 02:38:23,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 512/ 3125], loss: 0.172, per_step_time: 1415ms, lr: 9.984221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:23,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65334 samples/s/p 3:29:01 } +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 514/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.983946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66011 samples/s/p 3:28:44 } +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 516/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 9.983668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66105 samples/s/p 3:28:39 } +2024-07-30 02:38:31,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 518/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.983388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:31,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66079 samples/s/p 3:28:36 } +2024-07-30 02:38:34,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 520/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.983105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:34,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65930 samples/s/p 3:28:37 } +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 522/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 9.98282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66010 samples/s/p 3:28:32 } +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 524/ 3125], loss: 0.506, per_step_time: 1413ms, lr: 9.982533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.65962 samples/s/p 3:28:31 } +2024-07-30 02:38:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 526/ 3125], loss: 0.324, per_step_time: 1412ms, lr: 9.982244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66268 samples/s/p 3:28:21 } +2024-07-30 02:38:45,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 528/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.981952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:45,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66075 samples/s/p 3:28:22 } +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 530/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.981657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66059 samples/s/p 3:28:20 } +2024-07-30 02:38:51,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 532/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.981361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:51,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66027 samples/s/p 3:28:18 } +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 534/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.981061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66055 samples/s/p 3:28:14 } +2024-07-30 02:38:57,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 536/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.980759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:57,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.65998 samples/s/p 3:28:13 } +2024-07-30 02:39:00,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 538/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.980456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66218 samples/s/p 3:28:05 } +2024-07-30 02:39:02,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 540/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:02,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65936 samples/s/p 3:28:09 } +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 542/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.97984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66053 samples/s/p 3:28:03 } +2024-07-30 02:39:08,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 544/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 9.979529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65607 samples/s/p 3:28:10 } +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 546/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.979216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65425 samples/s/p 3:28:11 } +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 548/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.9788995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65832 samples/s/p 3:28:00 } +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 550/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.978581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65950 samples/s/p 3:27:54 } +2024-07-30 02:39:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 552/ 3125], loss: 0.391, per_step_time: 1415ms, lr: 9.978261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65211 samples/s/p 3:28:08 } +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 554/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.977938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65721 samples/s/p 3:27:53 } +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 556/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.9776125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:25,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.66010 samples/s/p 3:27:44 } +2024-07-30 02:39:28,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 558/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.977284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:28,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66130 samples/s/p 3:27:39 } +2024-07-30 02:39:31,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 560/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.976954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:31,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66116 samples/s/p 3:27:36 } +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 562/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:34,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66158 samples/s/p 3:27:33 } +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 564/ 3125], loss: 0.431, per_step_time: 1412ms, lr: 9.976287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:36,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.66173 samples/s/p 3:27:29 } +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 566/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.97595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.66047 samples/s/p 3:27:29 } +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 568/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 9.97561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.66181 samples/s/p 3:27:24 } +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 570/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 9.975269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65506 samples/s/p 3:27:36 } +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 572/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 9.974923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:48,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65981 samples/s/p 3:27:22 } +2024-07-30 02:39:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 574/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.974578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:51,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.66056 samples/s/p 3:27:18 } +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 576/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.974228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:53,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65587 samples/s/p 3:27:25 } +2024-07-30 02:39:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 578/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 9.973876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:56,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65732 samples/s/p 3:27:19 } +2024-07-30 02:39:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 580/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.9735225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:59,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65977 samples/s/p 3:27:11 } +2024-07-30 02:40:02,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 582/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 9.973166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:02,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65705 samples/s/p 3:27:14 } +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 584/ 3125], loss: 0.215, per_step_time: 1418ms, lr: 9.972808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.63970 samples/s/p 3:27:50 } +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 586/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.972447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66162 samples/s/p 3:26:59 } +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 588/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.972084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65776 samples/s/p 3:27:04 } +2024-07-30 02:40:13,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 590/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 9.971717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:13,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66247 samples/s/p 3:26:51 } +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 592/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 9.971349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65706 samples/s/p 3:27:00 } +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 594/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.970979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65864 samples/s/p 3:26:54 } +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 596/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 9.970605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:22,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65727 samples/s/p 3:26:54 } +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 598/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.970231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65985 samples/s/p 3:26:45 } +2024-07-30 02:40:27,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 600/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 9.969853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65244 samples/s/p 3:26:59 } +2024-07-30 02:40:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 602/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.969473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65929 samples/s/p 3:26:41 } +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 604/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 9.96909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65969 samples/s/p 3:26:37 } +2024-07-30 02:40:36,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 606/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.968706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:36,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66126 samples/s/p 3:26:31 } +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 608/ 3125], loss: 0.149, per_step_time: 1414ms, lr: 9.968318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65756 samples/s/p 3:26:36 } +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 610/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 9.967929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66244 samples/s/p 3:26:23 } +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 612/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.967536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:44,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66037 samples/s/p 3:26:25 } +2024-07-30 02:40:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 614/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 9.967143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65907 samples/s/p 3:26:25 } +2024-07-30 02:40:50,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 616/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.966746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65971 samples/s/p 3:26:20 } +2024-07-30 02:40:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 618/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.966347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65187 samples/s/p 3:26:35 } +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 620/ 3125], loss: 0.511, per_step_time: 1412ms, lr: 9.9659455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66190 samples/s/p 3:26:10 } +2024-07-30 02:40:59,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 622/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 9.965543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:59,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65627 samples/s/p 3:26:19 } +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 624/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 9.965136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66051 samples/s/p 3:26:07 } +2024-07-30 02:41:04,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 626/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 9.964728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66199 samples/s/p 3:26:01 } +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 628/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.964317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65870 samples/s/p 3:26:06 } +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 630/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.963903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66074 samples/s/p 3:25:58 } +2024-07-30 02:41:13,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 632/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.963488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:13,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65868 samples/s/p 3:26:00 } +2024-07-30 02:41:16,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 634/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 9.96307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:16,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65169 samples/s/p 3:26:12 } +2024-07-30 02:41:19,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 636/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 9.96265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:19,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65553 samples/s/p 3:26:01 } +2024-07-30 02:41:21,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 638/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.9622275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:21,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66092 samples/s/p 3:25:47 } +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 640/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.961802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66255 samples/s/p 3:25:40 } +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 642/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.961374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65907 samples/s/p 3:25:45 } +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 644/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.960944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65759 samples/s/p 3:25:45 } +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 646/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 9.960513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65507 samples/s/p 3:25:48 } +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 648/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 9.9600775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65936 samples/s/p 3:25:36 } +2024-07-30 02:41:38,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 650/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.959642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:38,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65953 samples/s/p 3:25:33 } +2024-07-30 02:41:41,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 652/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.9592025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:41,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65410 samples/s/p 3:25:42 } +2024-07-30 02:41:44,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 654/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 9.9587605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:44,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65544 samples/s/p 3:25:36 } +2024-07-30 02:41:47,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 656/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 9.958317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65703 samples/s/p 3:25:30 } +2024-07-30 02:41:50,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 658/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.95787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:50,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65950 samples/s/p 3:25:21 } +2024-07-30 02:41:53,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 660/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 9.957421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:53,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.66171 samples/s/p 3:25:14 } +2024-07-30 02:41:55,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 662/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.95697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65902 samples/s/p 3:25:17 } +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 664/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.956517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65867 samples/s/p 3:25:15 } +2024-07-30 02:42:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 666/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 9.95606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66183 samples/s/p 3:25:05 } +2024-07-30 02:42:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 668/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 9.955603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:04,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65741 samples/s/p 3:25:12 } +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 670/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 9.955142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66065 samples/s/p 3:25:02 } +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 672/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.95468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66116 samples/s/p 3:24:58 } +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 674/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 9.954214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66111 samples/s/p 3:24:55 } +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 676/ 3125], loss: 0.388, per_step_time: 1415ms, lr: 9.953746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:15,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65308 samples/s/p 3:25:10 } +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 678/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.953275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66138 samples/s/p 3:24:49 } +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 680/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.952803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65925 samples/s/p 3:24:51 } +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 682/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.9523295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65784 samples/s/p 3:24:51 } +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 684/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.951851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65725 samples/s/p 3:24:50 } +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 686/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.951372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65940 samples/s/p 3:24:42 } +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 688/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 9.950891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.64866 samples/s/p 3:25:03 } +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 690/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.950406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65581 samples/s/p 3:24:44 } +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 692/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 9.94992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66001 samples/s/p 3:24:32 } +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 694/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.949431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66109 samples/s/p 3:24:27 } +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 696/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.948939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66070 samples/s/p 3:24:25 } +2024-07-30 02:42:46,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 698/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.948445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:46,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66086 samples/s/p 3:24:22 } +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 700/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.947949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:49,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65816 samples/s/p 3:24:25 } +2024-07-30 02:42:52,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 702/ 3125], loss: 0.373, per_step_time: 1416ms, lr: 9.947451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:52,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.64925 samples/s/p 3:24:41 } +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 704/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.946951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65466 samples/s/p 3:24:27 } +2024-07-30 02:42:58,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 706/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.946447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:58,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.66146 samples/s/p 3:24:09 } +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 708/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.945942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.65865 samples/s/p 3:24:13 } +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 710/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 9.945434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66269 samples/s/p 3:24:01 } +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 712/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.9449235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66006 samples/s/p 3:24:04 } +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 714/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 9.944411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66280 samples/s/p 3:23:55 } +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 716/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.943897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66163 samples/s/p 3:23:55 } +2024-07-30 02:43:15,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 718/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 9.943379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66231 samples/s/p 3:23:51 } +2024-07-30 02:43:18,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 720/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.942859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66162 samples/s/p 3:23:49 } +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 722/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 9.942337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65724 samples/s/p 3:23:56 } +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 724/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.941812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65401 samples/s/p 3:24:00 } +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 726/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.941286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65529 samples/s/p 3:23:54 } +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 728/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.940757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65983 samples/s/p 3:23:42 } +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 730/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 9.940226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65767 samples/s/p 3:23:44 } +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 732/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 9.939692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65693 samples/s/p 3:23:42 } +2024-07-30 02:43:37,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 734/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.9391555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.66018 samples/s/p 3:23:33 } +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 736/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 9.938616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66065 samples/s/p 3:23:29 } +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 738/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.938076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65908 samples/s/p 3:23:29 } +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 740/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 9.937533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66136 samples/s/p 3:23:22 } +2024-07-30 02:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 742/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 9.936987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65674 samples/s/p 3:23:29 } +2024-07-30 02:43:52,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 744/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 9.93644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:52,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65141 samples/s/p 3:23:37 } +2024-07-30 02:43:54,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 746/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 9.935889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:54,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65116 samples/s/p 3:23:35 } +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 748/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 9.9353365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65738 samples/s/p 3:23:19 } +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.934782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65559 samples/s/p 3:23:20 } +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 752/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 9.934223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65690 samples/s/p 3:23:14 } +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 754/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 9.933664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65728 samples/s/p 3:23:11 } +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 756/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.933102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66091 samples/s/p 3:23:00 } +2024-07-30 02:44:11,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 758/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 9.932538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:11,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66076 samples/s/p 3:22:57 } +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 760/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.931971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66041 samples/s/p 3:22:55 } +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 762/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 9.931402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.65973 samples/s/p 3:22:54 } +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 764/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.93083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66016 samples/s/p 3:22:50 } +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.930256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.66153 samples/s/p 3:22:44 } +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 768/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.92968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.65897 samples/s/p 3:22:47 } +2024-07-30 02:44:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 770/ 3125], loss: 0.407, per_step_time: 1420ms, lr: 9.929101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:28,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.63316 samples/s/p 3:23:40 } +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 772/ 3125], loss: 0.230, per_step_time: 1421ms, lr: 9.928521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.62822 samples/s/p 3:23:48 } +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 774/ 3125], loss: 0.346, per_step_time: 1417ms, lr: 9.927937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64495 samples/s/p 3:23:09 } +2024-07-30 02:44:37,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 776/ 3125], loss: 0.453, per_step_time: 1416ms, lr: 9.927351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:37,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64848 samples/s/p 3:22:58 } +2024-07-30 02:44:40,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 778/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 9.926764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:40,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64970 samples/s/p 3:22:53 } +2024-07-30 02:44:43,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 780/ 3125], loss: 0.240, per_step_time: 1416ms, lr: 9.926173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:43,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64965 samples/s/p 3:22:50 } +2024-07-30 02:44:45,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 782/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 9.92558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:45,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.66004 samples/s/p 3:22:25 } +2024-07-30 02:44:48,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 784/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.9249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:48,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65991 samples/s/p 3:22:22 } +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 786/ 3125], loss: 0.095, per_step_time: 1414ms, lr: 9.924388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65450 samples/s/p 3:22:31 } +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 788/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.923788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.66005 samples/s/p 3:22:17 } +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 790/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.923186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65851 samples/s/p 3:22:17 } +2024-07-30 02:45:00,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 792/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.922582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:00,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65870 samples/s/p 3:22:14 } +2024-07-30 02:45:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 794/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.921975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65960 samples/s/p 3:22:09 } +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 796/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.921366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.66115 samples/s/p 3:22:03 } +2024-07-30 02:45:08,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 798/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.920755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:08,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65883 samples/s/p 3:22:05 } +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 800/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 9.920141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65817 samples/s/p 3:22:04 } +2024-07-30 02:45:14,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 802/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.919525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:14,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65880 samples/s/p 3:21:59 } +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 804/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 9.918906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65658 samples/s/p 3:22:01 } +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 806/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.918285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65890 samples/s/p 3:21:54 } +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 808/ 3125], loss: 0.374, per_step_time: 1415ms, lr: 9.917661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65344 samples/s/p 3:22:02 } +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 810/ 3125], loss: 0.288, per_step_time: 1421ms, lr: 9.917036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.62635 samples/s/p 3:22:58 } +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 812/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.916408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:28,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.65845 samples/s/p 3:21:46 } +2024-07-30 02:45:31,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 814/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.915778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:31,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66058 samples/s/p 3:21:39 } +2024-07-30 02:45:34,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 816/ 3125], loss: 0.241, per_step_time: 1416ms, lr: 9.915146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:34,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.64617 samples/s/p 3:22:07 } +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 818/ 3125], loss: 0.152, per_step_time: 1425ms, lr: 9.91451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.61203 samples/s/p 3:23:18 } +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 820/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 9.913872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66028 samples/s/p 3:21:31 } +2024-07-30 02:45:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 822/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 9.913233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.64026 samples/s/p 3:22:11 } +2024-07-30 02:45:45,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 824/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.912591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:45,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66082 samples/s/p 3:21:24 } +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 826/ 3125], loss: 0.379, per_step_time: 1412ms, lr: 9.911947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66225 samples/s/p 3:21:18 } +2024-07-30 02:45:51,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 828/ 3125], loss: 0.211, per_step_time: 1426ms, lr: 9.9112995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:51,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.60860 samples/s/p 3:23:11 } +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 830/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 9.910651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66255 samples/s/p 3:21:12 } +2024-07-30 02:45:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 832/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.909999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65891 samples/s/p 3:21:17 } +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 834/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 9.909346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66051 samples/s/p 3:21:10 } +2024-07-30 02:46:02,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 836/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.908689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66078 samples/s/p 3:21:07 } +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 838/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.908032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66024 samples/s/p 3:21:05 } +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 840/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.90737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66153 samples/s/p 3:21:00 } +2024-07-30 02:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 842/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.906707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65846 samples/s/p 3:21:04 } +2024-07-30 02:46:13,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 844/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.906042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65907 samples/s/p 3:20:59 } +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 846/ 3125], loss: 0.305, per_step_time: 1417ms, lr: 9.905374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.64275 samples/s/p 3:21:31 } +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 848/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 9.904704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65715 samples/s/p 3:20:58 } +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 850/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.904032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.66043 samples/s/p 3:20:48 } +2024-07-30 02:46:25,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 852/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 9.903357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:25,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65429 samples/s/p 3:20:58 } +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 854/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.902679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.66135 samples/s/p 3:20:40 } +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 856/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 9.902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65736 samples/s/p 3:20:46 } +2024-07-30 02:46:33,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 858/ 3125], loss: 0.175, per_step_time: 1416ms, lr: 9.901319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:33,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.64847 samples/s/p 3:21:02 } +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 860/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 9.900634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65454 samples/s/p 3:20:46 } +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 862/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 9.899947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65935 samples/s/p 3:20:33 } +2024-07-30 02:46:42,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 864/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.899259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:42,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65868 samples/s/p 3:20:32 } +2024-07-30 02:46:45,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 866/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.8985665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66080 samples/s/p 3:20:25 } +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 868/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.8978735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65710 samples/s/p 3:20:30 } +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 870/ 3125], loss: 0.532, per_step_time: 1413ms, lr: 9.897178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66094 samples/s/p 3:20:19 } +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 872/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.896479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65699 samples/s/p 3:20:24 } +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 874/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 9.895779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65996 samples/s/p 3:20:15 } +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 876/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.895076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66085 samples/s/p 3:20:10 } +2024-07-30 02:47:02,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 878/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.894371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:02,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.66083 samples/s/p 3:20:08 } +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 880/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 9.893663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65446 samples/s/p 3:20:18 } +2024-07-30 02:47:07,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 882/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 9.892953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65935 samples/s/p 3:20:05 } +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 884/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.892241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65822 samples/s/p 3:20:05 } +2024-07-30 02:47:13,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 886/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.891526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:13,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66134 samples/s/p 3:19:55 } +2024-07-30 02:47:16,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 888/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 9.890809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:16,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65302 samples/s/p 3:20:10 } +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 890/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 9.89009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66200 samples/s/p 3:19:48 } +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 892/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.889369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65919 samples/s/p 3:19:51 } +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 894/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.888645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65663 samples/s/p 3:19:54 } +2024-07-30 02:47:27,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 896/ 3125], loss: 0.519, per_step_time: 1414ms, lr: 9.887918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:27,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65640 samples/s/p 3:19:52 } +2024-07-30 02:47:30,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 898/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.88719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:30,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65811 samples/s/p 3:19:45 } +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 900/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 9.886458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.66185 samples/s/p 3:19:34 } +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 902/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 9.885725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65954 samples/s/p 3:19:36 } +2024-07-30 02:47:38,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 904/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.8849905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:38,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65525 samples/s/p 3:19:43 } +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 906/ 3125], loss: 0.260, per_step_time: 1412ms, lr: 9.884252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.66214 samples/s/p 3:19:25 } +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 908/ 3125], loss: 0.134, per_step_time: 1414ms, lr: 9.883512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65724 samples/s/p 3:19:33 } +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 910/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.8827695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65889 samples/s/p 3:19:27 } +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 912/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 9.882025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65952 samples/s/p 3:19:22 } +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 914/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.881277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.66002 samples/s/p 3:19:18 } +2024-07-30 02:47:55,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 916/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.8805285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:55,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.66034 samples/s/p 3:19:15 } +2024-07-30 02:47:58,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 918/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.879776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:58,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65916 samples/s/p 3:19:15 } +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 920/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.8790215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:01,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65920 samples/s/p 3:19:12 } +2024-07-30 02:48:04,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 922/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.878265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:04,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65678 samples/s/p 3:19:14 } +2024-07-30 02:48:07,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 924/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 9.877506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:07,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65379 samples/s/p 3:19:17 } +2024-07-30 02:48:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 926/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 9.876745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65759 samples/s/p 3:19:07 } +2024-07-30 02:48:12,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 928/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 9.875981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:12,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65836 samples/s/p 3:19:02 } +2024-07-30 02:48:15,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 930/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.875215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:15,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65801 samples/s/p 3:19:00 } +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 932/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 9.874447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.66005 samples/s/p 3:18:53 } +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 934/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.873676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.65547 samples/s/p 3:19:00 } +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 936/ 3125], loss: 0.248, per_step_time: 1424ms, lr: 9.872903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.61437 samples/s/p 3:20:24 } +2024-07-30 02:48:27,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 938/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.872128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:27,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65795 samples/s/p 3:18:49 } +2024-07-30 02:48:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 940/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.871351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:30,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65909 samples/s/p 3:18:44 } +2024-07-30 02:48:32,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 942/ 3125], loss: 0.095, per_step_time: 1412ms, lr: 9.8705705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.66206 samples/s/p 3:18:35 } +2024-07-30 02:48:35,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 944/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 9.869788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.65871 samples/s/p 3:18:39 } +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 946/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.869004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66248 samples/s/p 3:18:28 } +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 948/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 9.868218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.65970 samples/s/p 3:18:31 } +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 950/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.867428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66127 samples/s/p 3:18:25 } +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 952/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 9.866637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66035 samples/s/p 3:18:24 } +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 954/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.865843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66143 samples/s/p 3:18:19 } +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 956/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.865046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.65982 samples/s/p 3:18:20 } +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 958/ 3125], loss: 0.088, per_step_time: 1417ms, lr: 9.864249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64542 samples/s/p 3:18:47 } +2024-07-30 02:48:58,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 960/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.863448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:58,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64874 samples/s/p 3:18:37 } +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 962/ 3125], loss: 0.118, per_step_time: 1422ms, lr: 9.862644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.62469 samples/s/p 3:19:25 } +2024-07-30 02:49:04,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 964/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.861839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:04,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65912 samples/s/p 3:18:10 } +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 966/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.861032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65866 samples/s/p 3:18:08 } +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 968/ 3125], loss: 0.405, per_step_time: 1415ms, lr: 9.860221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.64997 samples/s/p 3:18:23 } +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 970/ 3125], loss: 0.535, per_step_time: 1413ms, lr: 9.859409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65866 samples/s/p 3:18:02 } +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 972/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 9.858593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:15,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65999 samples/s/p 3:17:57 } +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 974/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 9.8577775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66073 samples/s/p 3:17:52 } +2024-07-30 02:49:21,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 976/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.856958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65949 samples/s/p 3:17:52 } +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 978/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.856137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66010 samples/s/p 3:17:48 } +2024-07-30 02:49:26,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 980/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.855313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:26,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66098 samples/s/p 3:17:43 } +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 982/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.854486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65839 samples/s/p 3:17:46 } +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 984/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.8536575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65904 samples/s/p 3:17:42 } +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 986/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.852827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65948 samples/s/p 3:17:38 } +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 988/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.851993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66058 samples/s/p 3:17:33 } +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 990/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 9.851158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65856 samples/s/p 3:17:34 } +2024-07-30 02:49:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 992/ 3125], loss: 0.267, per_step_time: 1416ms, lr: 9.85032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.64598 samples/s/p 3:17:58 } +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 994/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.849479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65884 samples/s/p 3:17:28 } +2024-07-30 02:49:49,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 996/ 3125], loss: 0.733, per_step_time: 1414ms, lr: 9.848637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:49,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65635 samples/s/p 3:17:30 } +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 998/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.847792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65583 samples/s/p 3:17:29 } +2024-07-30 02:49:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1000/ 3125], loss: 0.555, per_step_time: 1414ms, lr: 9.846945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65673 samples/s/p 3:17:24 } +2024-07-30 02:49:57,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1002/ 3125], loss: 0.196, per_step_time: 1415ms, lr: 9.846096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65344 samples/s/p 3:17:28 } +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1004/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.845244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65793 samples/s/p 3:17:16 } +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1006/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.84439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65753 samples/s/p 3:17:14 } +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1008/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 9.843533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65404 samples/s/p 3:17:18 } +2024-07-30 02:50:09,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1010/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.842675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:09,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65863 samples/s/p 3:17:06 } +2024-07-30 02:50:12,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1012/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.841814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:12,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65948 samples/s/p 3:17:01 } +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1014/ 3125], loss: 0.384, per_step_time: 1412ms, lr: 9.840951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66226 samples/s/p 3:16:52 } +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1016/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.840085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65952 samples/s/p 3:16:55 } +2024-07-30 02:50:20,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1018/ 3125], loss: 0.232, per_step_time: 1416ms, lr: 9.839217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:20,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64673 samples/s/p 3:17:19 } +2024-07-30 02:50:23,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1020/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.838346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:23,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65963 samples/s/p 3:16:49 } +2024-07-30 02:50:26,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1022/ 3125], loss: 0.533, per_step_time: 1417ms, lr: 9.837474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64561 samples/s/p 3:17:16 } +2024-07-30 02:50:29,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1024/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.836599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:29,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65979 samples/s/p 3:16:43 } +2024-07-30 02:50:31,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1026/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.835722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:31,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.66137 samples/s/p 3:16:37 } +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1028/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 9.834843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.65968 samples/s/p 3:16:38 } +2024-07-30 02:50:37,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1030/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.833961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:37,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66075 samples/s/p 3:16:33 } +2024-07-30 02:50:40,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1032/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.833077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:40,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.65980 samples/s/p 3:16:32 } +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1034/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.83219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66177 samples/s/p 3:16:25 } +2024-07-30 02:50:46,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1036/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 9.831302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:46,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66254 samples/s/p 3:16:21 } +2024-07-30 02:50:48,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1038/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.83041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:48,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.65954 samples/s/p 3:16:24 } +2024-07-30 02:50:51,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1040/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 9.829518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:51,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66052 samples/s/p 3:16:19 } +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1042/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.828622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66050 samples/s/p 3:16:17 } +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1044/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.827724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.65993 samples/s/p 3:16:15 } +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1046/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 9.826823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65734 samples/s/p 3:16:17 } +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1048/ 3125], loss: 0.387, per_step_time: 1414ms, lr: 9.825921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65513 samples/s/p 3:16:19 } +2024-07-30 02:51:05,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1050/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 9.825016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:05,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65692 samples/s/p 3:16:13 } +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1052/ 3125], loss: 0.115, per_step_time: 1413ms, lr: 9.824109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.66066 samples/s/p 3:16:02 } +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1054/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 9.8231985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:11,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65675 samples/s/p 3:16:07 } +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1056/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.822287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65959 samples/s/p 3:15:59 } +2024-07-30 02:51:17,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1058/ 3125], loss: 0.219, per_step_time: 1416ms, lr: 9.821373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:17,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.64670 samples/s/p 3:16:23 } +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1060/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.820457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66011 samples/s/p 3:15:52 } +2024-07-30 02:51:22,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1062/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 9.819539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65278 samples/s/p 3:16:04 } +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1064/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.8186165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66096 samples/s/p 3:15:44 } +2024-07-30 02:51:28,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1066/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.817693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:28,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66091 samples/s/p 3:15:42 } +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1068/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 9.8167675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:31,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66172 samples/s/p 3:15:37 } +2024-07-30 02:51:34,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1070/ 3125], loss: 0.564, per_step_time: 1413ms, lr: 9.815841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:34,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65957 samples/s/p 3:15:39 } +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1072/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 9.81491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66153 samples/s/p 3:15:32 } +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1074/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.813978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65600 samples/s/p 3:15:41 } +2024-07-30 02:51:42,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1076/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 9.813043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:42,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65984 samples/s/p 3:15:30 } +2024-07-30 02:51:45,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1078/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.812105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:45,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66163 samples/s/p 3:15:23 } +2024-07-30 02:51:48,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1080/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.811166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:48,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66130 samples/s/p 3:15:21 } +2024-07-30 02:51:51,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1082/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.810225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:51,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65933 samples/s/p 3:15:22 } +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1084/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.8092805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65999 samples/s/p 3:15:18 } +2024-07-30 02:51:56,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1086/ 3125], loss: 0.335, per_step_time: 1412ms, lr: 9.808335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:56,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66256 samples/s/p 3:15:10 } +2024-07-30 02:51:59,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1088/ 3125], loss: 0.302, per_step_time: 1416ms, lr: 9.807386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:59,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.64731 samples/s/p 3:15:39 } +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1090/ 3125], loss: 0.307, per_step_time: 1415ms, lr: 9.806435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65102 samples/s/p 3:15:28 } +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1092/ 3125], loss: 0.224, per_step_time: 1415ms, lr: 9.8054825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65115 samples/s/p 3:15:25 } +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1094/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 9.804527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65310 samples/s/p 3:15:18 } +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1096/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.803569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.66038 samples/s/p 3:15:00 } +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1098/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 9.8026085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65696 samples/s/p 3:15:05 } +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1100/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.801647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65695 samples/s/p 3:15:02 } +2024-07-30 02:52:19,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1102/ 3125], loss: 0.628, per_step_time: 1413ms, lr: 9.800682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:19,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65879 samples/s/p 3:14:55 } +2024-07-30 02:52:22,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1104/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.799715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:22,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66112 samples/s/p 3:14:48 } +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1106/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 9.798746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66046 samples/s/p 3:14:46 } +2024-07-30 02:52:28,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1108/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.7977745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66066 samples/s/p 3:14:43 } +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1110/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.7968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66041 samples/s/p 3:14:41 } +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1112/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.795824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65925 samples/s/p 3:14:40 } +2024-07-30 02:52:36,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1114/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.794847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:36,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65951 samples/s/p 3:14:37 } +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1116/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.7938655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65946 samples/s/p 3:14:34 } +2024-07-30 02:52:42,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1118/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 9.792882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:42,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66111 samples/s/p 3:14:28 } +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1120/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.791896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:45,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66132 samples/s/p 3:14:25 } +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1122/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 9.790909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.65671 samples/s/p 3:14:31 } +2024-07-30 02:52:50,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1124/ 3125], loss: 0.094, per_step_time: 1416ms, lr: 9.789919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:50,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.64785 samples/s/p 3:14:47 } +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1126/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.788928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.65826 samples/s/p 3:14:22 } +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1128/ 3125], loss: 0.300, per_step_time: 1417ms, lr: 9.787934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.64563 samples/s/p 3:14:46 } +2024-07-30 02:52:59,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1130/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.786936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:59,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66071 samples/s/p 3:14:12 } +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1132/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.785938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65794 samples/s/p 3:14:15 } +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1134/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.784937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66112 samples/s/p 3:14:05 } +2024-07-30 02:53:07,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1136/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 9.783933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:07,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66173 samples/s/p 3:14:01 } +2024-07-30 02:53:10,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1138/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 9.782927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:10,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65553 samples/s/p 3:14:11 } +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1140/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.781919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:13,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65956 samples/s/p 3:14:00 } +2024-07-30 02:53:16,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1142/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.780909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:16,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65722 samples/s/p 3:14:02 } +2024-07-30 02:53:19,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1144/ 3125], loss: 0.359, per_step_time: 1415ms, lr: 9.779896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:19,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65331 samples/s/p 3:14:07 } +2024-07-30 02:53:22,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1146/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 9.778881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:22,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65744 samples/s/p 3:13:56 } +2024-07-30 02:53:24,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1148/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.777864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65909 samples/s/p 3:13:50 } +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1150/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 9.776844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65623 samples/s/p 3:13:53 } +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1152/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.775823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65971 samples/s/p 3:13:43 } +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1154/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.774798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65708 samples/s/p 3:13:45 } +2024-07-30 02:53:36,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1156/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.773771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:36,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65810 samples/s/p 3:13:40 } +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1158/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.772743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66042 samples/s/p 3:13:33 } +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1160/ 3125], loss: 0.465, per_step_time: 1412ms, lr: 9.771713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66198 samples/s/p 3:13:27 } +2024-07-30 02:53:44,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1162/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.770679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:44,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65786 samples/s/p 3:13:32 } +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1164/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 9.769644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65834 samples/s/p 3:13:29 } +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1166/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.768606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66138 samples/s/p 3:13:20 } +2024-07-30 02:53:53,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1168/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.767566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:53,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65972 samples/s/p 3:13:20 } +2024-07-30 02:53:56,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1170/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 9.766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:56,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66199 samples/s/p 3:13:13 } +2024-07-30 02:53:58,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1172/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 9.765479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:58,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65738 samples/s/p 3:13:19 } +2024-07-30 02:54:01,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1174/ 3125], loss: 0.124, per_step_time: 1416ms, lr: 9.764432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:01,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.64896 samples/s/p 3:13:34 } +2024-07-30 02:54:04,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1176/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 9.763384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:04,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65948 samples/s/p 3:13:09 } +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1178/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.762332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65437 samples/s/p 3:13:17 } +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1180/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 9.761278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65546 samples/s/p 3:13:12 } +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1182/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 9.760222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65707 samples/s/p 3:13:06 } +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1184/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 9.759164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65581 samples/s/p 3:13:05 } +2024-07-30 02:54:18,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1186/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 9.758104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65930 samples/s/p 3:12:55 } +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1188/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.75704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:21,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65965 samples/s/p 3:12:52 } +2024-07-30 02:54:24,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1190/ 3125], loss: 0.580, per_step_time: 1412ms, lr: 9.755976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:24,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66173 samples/s/p 3:12:45 } +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1192/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.754908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65844 samples/s/p 3:12:49 } +2024-07-30 02:54:30,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1194/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.75384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:30,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65978 samples/s/p 3:12:43 } +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1196/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.752767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66069 samples/s/p 3:12:39 } +2024-07-30 02:54:35,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1198/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.751693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:35,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65857 samples/s/p 3:12:40 } +2024-07-30 02:54:38,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1200/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 9.750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:38,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65659 samples/s/p 3:12:41 } +2024-07-30 02:54:41,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1202/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 9.749538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:41,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66062 samples/s/p 3:12:30 } +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1204/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.748457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66109 samples/s/p 3:12:26 } +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1206/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 9.747374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65723 samples/s/p 3:12:31 } +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1208/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.746288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65981 samples/s/p 3:12:23 } +2024-07-30 02:54:52,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1210/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.7452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66054 samples/s/p 3:12:19 } +2024-07-30 02:54:55,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1212/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 9.744111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:55,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65728 samples/s/p 3:12:23 } +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1214/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.7430175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66054 samples/s/p 3:12:13 } +2024-07-30 02:55:01,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1216/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.741923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:01,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.66013 samples/s/p 3:12:11 } +2024-07-30 02:55:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1218/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.7408265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.66057 samples/s/p 3:12:08 } +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1220/ 3125], loss: 0.406, per_step_time: 1414ms, lr: 9.739729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:06,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.65687 samples/s/p 3:12:12 } +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1222/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.738626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:09,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.65538 samples/s/p 3:12:13 } +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1224/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65842 samples/s/p 3:12:04 } +2024-07-30 02:55:15,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1226/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.736417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:15,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66012 samples/s/p 3:11:57 } +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1228/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 9.7353095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66042 samples/s/p 3:11:54 } +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1230/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.734199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65983 samples/s/p 3:11:52 } +2024-07-30 02:55:23,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1232/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.733087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:23,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65806 samples/s/p 3:11:53 } +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1234/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 9.731971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65551 samples/s/p 3:11:55 } +2024-07-30 02:55:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1236/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.730855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:29,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65842 samples/s/p 3:11:47 } +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1238/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.729735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66022 samples/s/p 3:11:40 } +2024-07-30 02:55:35,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1240/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.728614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66032 samples/s/p 3:11:37 } +2024-07-30 02:55:38,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1242/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 9.727489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:38,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65944 samples/s/p 3:11:36 } +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1244/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 9.726363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66176 samples/s/p 3:11:29 } +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1246/ 3125], loss: 0.466, per_step_time: 1414ms, lr: 9.725235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65677 samples/s/p 3:11:36 } +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1248/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 9.7241045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66093 samples/s/p 3:11:25 } +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1250/ 3125], loss: 0.301, per_step_time: 1415ms, lr: 9.722971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:49,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65092 samples/s/p 3:11:42 } +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1252/ 3125], loss: 0.246, per_step_time: 1415ms, lr: 9.721835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65339 samples/s/p 3:11:34 } +2024-07-30 02:55:55,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1254/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.7206985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:55,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65566 samples/s/p 3:11:27 } +2024-07-30 02:55:57,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1256/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.719559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:57,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66155 samples/s/p 3:11:12 } +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1258/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.718417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66086 samples/s/p 3:11:11 } +2024-07-30 02:56:03,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1260/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.717272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:03,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66005 samples/s/p 3:11:09 } +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1262/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.716126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66019 samples/s/p 3:11:06 } +2024-07-30 02:56:09,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1264/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.714978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:09,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66032 samples/s/p 3:11:03 } +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1266/ 3125], loss: 0.501, per_step_time: 1413ms, lr: 9.713827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66033 samples/s/p 3:11:00 } +2024-07-30 02:56:14,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1268/ 3125], loss: 0.166, per_step_time: 1417ms, lr: 9.712674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:14,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.64189 samples/s/p 3:11:35 } +2024-07-30 02:56:17,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1270/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.711518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65946 samples/s/p 3:10:56 } +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1272/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.71036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65894 samples/s/p 3:10:55 } +2024-07-30 02:56:23,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1274/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 9.709201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:23,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65769 samples/s/p 3:10:54 } +2024-07-30 02:56:26,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1276/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.708038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:26,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65960 samples/s/p 3:10:48 } +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1278/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.706873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65688 samples/s/p 3:10:50 } +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1280/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 9.705706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65818 samples/s/p 3:10:45 } +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1282/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 9.704539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65201 samples/s/p 3:10:55 } +2024-07-30 02:56:37,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1284/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.703367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:37,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65967 samples/s/p 3:10:36 } +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1286/ 3125], loss: 0.480, per_step_time: 1416ms, lr: 9.702194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.64897 samples/s/p 3:10:55 } +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1288/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.701018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66057 samples/s/p 3:10:29 } +2024-07-30 02:56:46,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1290/ 3125], loss: 0.396, per_step_time: 1412ms, lr: 9.69984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66239 samples/s/p 3:10:22 } +2024-07-30 02:56:48,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1292/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.6986605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:48,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65977 samples/s/p 3:10:25 } +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1294/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.697477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65860 samples/s/p 3:10:24 } +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1296/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 9.696292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65738 samples/s/p 3:10:24 } +2024-07-30 02:56:57,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1298/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 9.695105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:57,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65982 samples/s/p 3:10:16 } +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1300/ 3125], loss: 0.553, per_step_time: 1418ms, lr: 9.693917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.63952 samples/s/p 3:10:54 } +2024-07-30 02:57:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1302/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.692725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:03,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66083 samples/s/p 3:10:08 } +2024-07-30 02:57:05,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1304/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.691531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:05,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66095 samples/s/p 3:10:05 } +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1306/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 9.690336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66113 samples/s/p 3:10:02 } +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1308/ 3125], loss: 0.329, per_step_time: 1414ms, lr: 9.689138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.65724 samples/s/p 3:10:07 } +2024-07-30 02:57:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1310/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.687938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:14,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66017 samples/s/p 3:09:58 } +2024-07-30 02:57:17,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1312/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 9.686734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:17,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66075 samples/s/p 3:09:54 } +2024-07-30 02:57:20,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1314/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 9.685529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65770 samples/s/p 3:09:58 } +2024-07-30 02:57:22,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1316/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.684323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:22,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65532 samples/s/p 3:10:00 } +2024-07-30 02:57:25,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1318/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.683114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:25,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66150 samples/s/p 3:09:44 } +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1320/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 9.681902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65749 samples/s/p 3:09:50 } +2024-07-30 02:57:31,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1322/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.680688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:31,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66119 samples/s/p 3:09:39 } +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1324/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.679472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66158 samples/s/p 3:09:36 } +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1326/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.678254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66011 samples/s/p 3:09:36 } +2024-07-30 02:57:40,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1328/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 9.677034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:40,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65619 samples/s/p 3:09:41 } +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1330/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 9.67581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65815 samples/s/p 3:09:34 } +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1332/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.674586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:45,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.66050 samples/s/p 3:09:27 } +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1334/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.673359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65864 samples/s/p 3:09:28 } +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1336/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.67213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65494 samples/s/p 3:09:32 } +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1338/ 3125], loss: 0.599, per_step_time: 1413ms, lr: 9.670897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66064 samples/s/p 3:09:18 } +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1340/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 9.669664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:57,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65318 samples/s/p 3:09:30 } +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1342/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.668427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66185 samples/s/p 3:09:10 } +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1344/ 3125], loss: 0.351, per_step_time: 1414ms, lr: 9.667189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:02,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65729 samples/s/p 3:09:16 } +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1346/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.665949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66220 samples/s/p 3:09:04 } +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1348/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.664705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66051 samples/s/p 3:09:04 } +2024-07-30 02:58:11,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1350/ 3125], loss: 0.249, per_step_time: 1412ms, lr: 9.663461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:11,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66469 samples/s/p 3:08:53 } +2024-07-30 02:58:14,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1352/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.662214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:14,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.65909 samples/s/p 3:09:01 } +2024-07-30 02:58:16,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1354/ 3125], loss: 0.305, per_step_time: 1412ms, lr: 9.660965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:16,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66225 samples/s/p 3:08:52 } +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1356/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 9.659713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:19,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65726 samples/s/p 3:08:59 } +2024-07-30 02:58:22,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1358/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 9.658459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:22,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66109 samples/s/p 3:08:49 } +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1360/ 3125], loss: 0.098, per_step_time: 1425ms, lr: 9.657203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.61287 samples/s/p 3:10:23 } +2024-07-30 02:58:28,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1362/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 9.655945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:28,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66025 samples/s/p 3:08:45 } +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1364/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.654684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66040 samples/s/p 3:08:42 } +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1366/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 9.65342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65767 samples/s/p 3:08:44 } +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1368/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 9.652156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65959 samples/s/p 3:08:38 } +2024-07-30 02:58:39,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1370/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.650888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66005 samples/s/p 3:08:34 } +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1372/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.64962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66103 samples/s/p 3:08:29 } +2024-07-30 02:58:45,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1374/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 9.648348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66179 samples/s/p 3:08:25 } +2024-07-30 02:58:48,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1376/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.647073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:48,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65934 samples/s/p 3:08:27 } +2024-07-30 02:58:50,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1378/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.645798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:50,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65874 samples/s/p 3:08:25 } +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1380/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.64452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66037 samples/s/p 3:08:19 } +2024-07-30 02:58:56,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1382/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.643239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:56,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65812 samples/s/p 3:08:21 } +2024-07-30 02:58:59,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1384/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.641956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:59,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65916 samples/s/p 3:08:16 } +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1386/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 9.640671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65215 samples/s/p 3:08:27 } +2024-07-30 02:59:05,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1388/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.639384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:05,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65686 samples/s/p 3:08:15 } +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1390/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 9.6380945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.66115 samples/s/p 3:08:03 } +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1392/ 3125], loss: 0.252, per_step_time: 1416ms, lr: 9.636802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.64775 samples/s/p 3:08:27 } +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1394/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 9.635509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65666 samples/s/p 3:08:07 } +2024-07-30 02:59:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1396/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.634213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66053 samples/s/p 3:07:56 } +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1398/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.632915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66040 samples/s/p 3:07:54 } +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1400/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.6316135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65698 samples/s/p 3:07:58 } +2024-07-30 02:59:22,059 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1402/ 3125], loss: 0.537, per_step_time: 2144ms, lr: 9.630311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 3.73120 samples/s/p 4:44:54 } +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1404/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.629006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65763 samples/s/p 3:07:51 } +2024-07-30 03:00:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1406/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 9.6277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:02,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65879 samples/s/p 3:07:46 } +2024-07-30 03:00:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1408/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.62639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:05,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65942 samples/s/p 3:07:41 } +2024-07-30 03:00:08,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1410/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 9.625078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:08,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65491 samples/s/p 3:07:48 } +2024-07-30 03:00:11,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1412/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 9.6237645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:11,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65117 samples/s/p 3:07:52 } +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1414/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 9.6224485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65663 samples/s/p 3:07:39 } +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1416/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.621131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66013 samples/s/p 3:07:29 } +2024-07-30 03:00:19,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1418/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 9.61981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:19,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66248 samples/s/p 3:07:21 } +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1420/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.618488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66074 samples/s/p 3:07:22 } +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1422/ 3125], loss: 0.702, per_step_time: 1413ms, lr: 9.617163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66108 samples/s/p 3:07:18 } +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1424/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.615836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65927 samples/s/p 3:07:19 } +2024-07-30 03:00:31,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1426/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 9.614508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:31,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65671 samples/s/p 3:07:21 } +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1428/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.613175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:34,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65962 samples/s/p 3:07:13 } +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1430/ 3125], loss: 0.338, per_step_time: 1412ms, lr: 9.611842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66210 samples/s/p 3:07:05 } +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1432/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.610506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.65932 samples/s/p 3:07:08 } +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1434/ 3125], loss: 0.264, per_step_time: 1416ms, lr: 9.609167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.64906 samples/s/p 3:07:25 } +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1436/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.607828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.65963 samples/s/p 3:07:01 } +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1438/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.606485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66127 samples/s/p 3:06:55 } +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1440/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 9.605141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66210 samples/s/p 3:06:51 } +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1442/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 9.603795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66092 samples/s/p 3:06:50 } +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1444/ 3125], loss: 0.148, per_step_time: 1418ms, lr: 9.602445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:56,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.63899 samples/s/p 3:07:31 } +2024-07-30 03:00:59,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1446/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 9.601094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64994 samples/s/p 3:07:07 } +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1448/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 9.599741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64803 samples/s/p 3:07:07 } +2024-07-30 03:01:05,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1450/ 3125], loss: 0.306, per_step_time: 1419ms, lr: 9.598385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:05,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63467 samples/s/p 3:07:31 } +2024-07-30 03:01:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1452/ 3125], loss: 0.187, per_step_time: 1421ms, lr: 9.597027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:08,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.62932 samples/s/p 3:07:39 } +2024-07-30 03:01:10,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1454/ 3125], loss: 0.147, per_step_time: 1419ms, lr: 9.595667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63693 samples/s/p 3:07:21 } +2024-07-30 03:01:13,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1456/ 3125], loss: 0.250, per_step_time: 1427ms, lr: 9.594305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.60370 samples/s/p 3:08:25 } +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1458/ 3125], loss: 0.402, per_step_time: 1418ms, lr: 9.592941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.63894 samples/s/p 3:07:11 } +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1460/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.591575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65896 samples/s/p 3:06:29 } +2024-07-30 03:01:22,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1462/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.590206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:22,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65846 samples/s/p 3:06:27 } +2024-07-30 03:01:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1464/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 9.588835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:25,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65765 samples/s/p 3:06:26 } +2024-07-30 03:01:28,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1466/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 9.587462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:28,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65933 samples/s/p 3:06:20 } +2024-07-30 03:01:30,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1468/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.586086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:30,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65739 samples/s/p 3:06:21 } +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1470/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 9.584708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65509 samples/s/p 3:06:22 } +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1472/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.583328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65882 samples/s/p 3:06:12 } +2024-07-30 03:01:39,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1474/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.581947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.66066 samples/s/p 3:06:06 } +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1476/ 3125], loss: 0.335, per_step_time: 1416ms, lr: 9.580563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.64777 samples/s/p 3:06:28 } +2024-07-30 03:01:45,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1478/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.579177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65910 samples/s/p 3:06:03 } +2024-07-30 03:01:47,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1480/ 3125], loss: 0.177, per_step_time: 1419ms, lr: 9.577788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:47,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.63655 samples/s/p 3:06:45 } +2024-07-30 03:01:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1482/ 3125], loss: 0.156, per_step_time: 1419ms, lr: 9.576398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:50,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.63727 samples/s/p 3:06:41 } +2024-07-30 03:01:53,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1484/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 9.575005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65471 samples/s/p 3:06:03 } +2024-07-30 03:01:56,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1486/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.5736095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:56,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65447 samples/s/p 3:06:01 } +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1488/ 3125], loss: 0.203, per_step_time: 1416ms, lr: 9.572213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.64654 samples/s/p 3:06:14 } +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1490/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 9.570813e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66277 samples/s/p 3:05:39 } +2024-07-30 03:02:04,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1492/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.569411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65773 samples/s/p 3:05:46 } +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1494/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 9.568008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66124 samples/s/p 3:05:36 } +2024-07-30 03:02:10,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1496/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.566602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:10,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65591 samples/s/p 3:05:44 } +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1498/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 9.565194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65602 samples/s/p 3:05:41 } +2024-07-30 03:02:16,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1500/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 9.563783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:16,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65891 samples/s/p 3:05:32 } +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1502/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.562372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65987 samples/s/p 3:05:28 } +2024-07-30 03:02:21,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1504/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.560956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:21,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65919 samples/s/p 3:05:26 } +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1506/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 9.55954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:24,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66126 samples/s/p 3:05:19 } +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1508/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 9.558121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65729 samples/s/p 3:05:24 } +2024-07-30 03:02:30,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1510/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 9.556699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:30,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.64847 samples/s/p 3:05:39 } +2024-07-30 03:02:33,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1512/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 9.555276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65722 samples/s/p 3:05:19 } +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1514/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 9.553851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66043 samples/s/p 3:05:10 } +2024-07-30 03:02:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1516/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 9.552423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:38,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65889 samples/s/p 3:05:10 } +2024-07-30 03:02:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1518/ 3125], loss: 0.398, per_step_time: 1415ms, lr: 9.550993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65264 samples/s/p 3:05:19 } +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1520/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 9.549562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:44,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.66283 samples/s/p 3:04:56 } +2024-07-30 03:02:47,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1522/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.548126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:47,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65906 samples/s/p 3:05:01 } +2024-07-30 03:02:50,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1524/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.54669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65950 samples/s/p 3:04:57 } +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1526/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 9.545252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65285 samples/s/p 3:05:08 } +2024-07-30 03:02:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1528/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 9.543812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65752 samples/s/p 3:04:56 } +2024-07-30 03:02:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1530/ 3125], loss: 0.642, per_step_time: 1413ms, lr: 9.542368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:58,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65984 samples/s/p 3:04:48 } +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1532/ 3125], loss: 0.652, per_step_time: 1414ms, lr: 9.540923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65404 samples/s/p 3:04:57 } +2024-07-30 03:03:04,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1534/ 3125], loss: 0.135, per_step_time: 1414ms, lr: 9.539476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:04,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65474 samples/s/p 3:04:53 } +2024-07-30 03:03:07,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1536/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.5380265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65883 samples/s/p 3:04:42 } +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1538/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 9.536576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:10,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66007 samples/s/p 3:04:36 } +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1540/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 9.5351215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66002 samples/s/p 3:04:34 } +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1542/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.533665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65994 samples/s/p 3:04:31 } +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1544/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.532207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66019 samples/s/p 3:04:28 } +2024-07-30 03:03:21,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1546/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.530747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:21,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66088 samples/s/p 3:04:24 } +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1548/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.529285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.65965 samples/s/p 3:04:23 } +2024-07-30 03:03:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1550/ 3125], loss: 0.290, per_step_time: 1412ms, lr: 9.52782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:27,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66304 samples/s/p 3:04:14 } +2024-07-30 03:03:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1552/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.526354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:29,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65953 samples/s/p 3:04:18 } +2024-07-30 03:03:32,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1554/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 9.524885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:32,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65468 samples/s/p 3:04:24 } +2024-07-30 03:03:35,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1556/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 9.5234145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:35,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66113 samples/s/p 3:04:09 } +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1558/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.52194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66004 samples/s/p 3:04:08 } +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1560/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.520465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66167 samples/s/p 3:04:02 } +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1562/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.518988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65976 samples/s/p 3:04:03 } +2024-07-30 03:03:46,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1564/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 9.517508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:46,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65718 samples/s/p 3:04:05 } +2024-07-30 03:03:49,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1566/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.516027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:49,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65728 samples/s/p 3:04:02 } +2024-07-30 03:03:52,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1568/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 9.514542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:52,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65760 samples/s/p 3:03:59 } +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1570/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.513056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65850 samples/s/p 3:03:54 } +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1572/ 3125], loss: 0.147, per_step_time: 1414ms, lr: 9.511568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65438 samples/s/p 3:03:59 } +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1574/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 9.510079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65756 samples/s/p 3:03:50 } +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1576/ 3125], loss: 0.207, per_step_time: 1425ms, lr: 9.508584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.61200 samples/s/p 3:05:17 } +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1578/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.50709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.66050 samples/s/p 3:03:39 } +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1580/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.505594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65696 samples/s/p 3:03:43 } +2024-07-30 03:04:12,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1582/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.504094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:12,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65836 samples/s/p 3:03:38 } +2024-07-30 03:04:15,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1584/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 9.5025935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:15,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65544 samples/s/p 3:03:40 } +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1586/ 3125], loss: 0.383, per_step_time: 1416ms, lr: 9.50109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.64872 samples/s/p 3:03:51 } +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1588/ 3125], loss: 0.414, per_step_time: 1414ms, lr: 9.499584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65693 samples/s/p 3:03:32 } +2024-07-30 03:04:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1590/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.498076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:23,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65460 samples/s/p 3:03:34 } +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1592/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.496567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65969 samples/s/p 3:03:21 } +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1594/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.495055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65391 samples/s/p 3:03:29 } +2024-07-30 03:04:32,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1596/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.49354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65786 samples/s/p 3:03:19 } +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1598/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.492024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65415 samples/s/p 3:03:23 } +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1600/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.490506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65517 samples/s/p 3:03:18 } +2024-07-30 03:04:40,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1602/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.488986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66042 samples/s/p 3:03:05 } +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1604/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 9.487463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66225 samples/s/p 3:02:59 } +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1606/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.485938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66032 samples/s/p 3:03:00 } +2024-07-30 03:04:49,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1608/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.484411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:49,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65575 samples/s/p 3:03:06 } +2024-07-30 03:04:52,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1610/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.482882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:52,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65900 samples/s/p 3:02:57 } +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1612/ 3125], loss: 0.373, per_step_time: 1414ms, lr: 9.48135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65646 samples/s/p 3:02:59 } +2024-07-30 03:04:57,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1614/ 3125], loss: 0.432, per_step_time: 1412ms, lr: 9.479818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.66205 samples/s/p 3:02:45 } +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1616/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.478282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:00,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65809 samples/s/p 3:02:50 } +2024-07-30 03:05:03,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1618/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.476745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:03,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.65893 samples/s/p 3:02:46 } +2024-07-30 03:05:06,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1620/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.475205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:06,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66095 samples/s/p 3:02:39 } +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1622/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 9.473662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66040 samples/s/p 3:02:37 } +2024-07-30 03:05:12,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1624/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 9.472118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:12,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66052 samples/s/p 3:02:34 } +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1626/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 9.470572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66236 samples/s/p 3:02:28 } +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1628/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.469024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66017 samples/s/p 3:02:29 } +2024-07-30 03:05:20,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1630/ 3125], loss: 0.332, per_step_time: 1412ms, lr: 9.467472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66195 samples/s/p 3:02:23 } +2024-07-30 03:05:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1632/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.465921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66220 samples/s/p 3:02:19 } +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1634/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.4643665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.65917 samples/s/p 3:02:22 } +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1636/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.4628085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66076 samples/s/p 3:02:17 } +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1638/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 9.46125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66042 samples/s/p 3:02:14 } +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1640/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 9.459689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65888 samples/s/p 3:02:15 } +2024-07-30 03:05:37,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1642/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.4581255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:37,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65859 samples/s/p 3:02:12 } +2024-07-30 03:05:40,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1644/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 9.45656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:40,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65230 samples/s/p 3:02:22 } +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1646/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 9.454992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65613 samples/s/p 3:02:11 } +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1648/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 9.453423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65757 samples/s/p 3:02:06 } +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1650/ 3125], loss: 0.204, per_step_time: 1415ms, lr: 9.451852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65350 samples/s/p 3:02:11 } +2024-07-30 03:05:51,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1652/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.450278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:51,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65823 samples/s/p 3:01:59 } +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1654/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.448701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.66168 samples/s/p 3:01:49 } +2024-07-30 03:05:57,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1656/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 9.447123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:57,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66050 samples/s/p 3:01:49 } +2024-07-30 03:06:00,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1658/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.445543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:00,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65947 samples/s/p 3:01:48 } +2024-07-30 03:06:03,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1660/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.443961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:03,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66157 samples/s/p 3:01:41 } +2024-07-30 03:06:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1662/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.442376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65888 samples/s/p 3:01:43 } +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1664/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.44079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65856 samples/s/p 3:01:41 } +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1666/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 9.439201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66356 samples/s/p 3:01:29 } +2024-07-30 03:06:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1668/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.43761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65852 samples/s/p 3:01:36 } +2024-07-30 03:06:17,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1670/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.436017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:17,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66108 samples/s/p 3:01:28 } +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1672/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.434422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65561 samples/s/p 3:01:36 } +2024-07-30 03:06:22,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1674/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.432824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65873 samples/s/p 3:01:27 } +2024-07-30 03:06:25,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1676/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.431225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66144 samples/s/p 3:01:19 } +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1678/ 3125], loss: 0.519, per_step_time: 1413ms, lr: 9.429624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66014 samples/s/p 3:01:18 } +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1680/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 9.42802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65538 samples/s/p 3:01:25 } +2024-07-30 03:06:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1682/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 9.426415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65665 samples/s/p 3:01:19 } +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1684/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 9.424806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:37,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.65768 samples/s/p 3:01:15 } +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1686/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 9.423197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.66169 samples/s/p 3:01:04 } +2024-07-30 03:06:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1688/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.421586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66157 samples/s/p 3:01:02 } +2024-07-30 03:06:45,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1690/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.419971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:45,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.65997 samples/s/p 3:01:02 } +2024-07-30 03:06:48,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1692/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.418355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:48,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66042 samples/s/p 3:00:58 } +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1694/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.416737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66121 samples/s/p 3:00:54 } +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1696/ 3125], loss: 0.180, per_step_time: 1412ms, lr: 9.415116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66185 samples/s/p 3:00:50 } +2024-07-30 03:06:56,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1698/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.413494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:56,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65849 samples/s/p 3:00:53 } +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1700/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 9.411869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65647 samples/s/p 3:00:54 } +2024-07-30 03:07:02,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1702/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 9.410242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:02,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66075 samples/s/p 3:00:43 } +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1704/ 3125], loss: 0.429, per_step_time: 1414ms, lr: 9.408614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:05,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65559 samples/s/p 3:00:50 } +2024-07-30 03:07:08,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1706/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.406983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:08,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66137 samples/s/p 3:00:36 } +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1708/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 9.4053485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65672 samples/s/p 3:00:43 } +2024-07-30 03:07:13,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1710/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 9.403714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:13,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66040 samples/s/p 3:00:33 } +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1712/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.402076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66117 samples/s/p 3:00:28 } +2024-07-30 03:07:19,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1714/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 9.400437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:19,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65998 samples/s/p 3:00:28 } +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1716/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.398796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:22,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66251 samples/s/p 3:00:20 } +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1718/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.397152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66018 samples/s/p 3:00:22 } +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1720/ 3125], loss: 0.358, per_step_time: 1414ms, lr: 9.395506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65748 samples/s/p 3:00:24 } +2024-07-30 03:07:30,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1722/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.393859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:30,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65475 samples/s/p 3:00:27 } +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1724/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 9.392209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65470 samples/s/p 3:00:24 } +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1726/ 3125], loss: 0.149, per_step_time: 1415ms, lr: 9.390556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65060 samples/s/p 3:00:29 } +2024-07-30 03:07:39,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1728/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 9.388902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65631 samples/s/p 3:00:15 } +2024-07-30 03:07:42,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1730/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 9.387246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:42,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66136 samples/s/p 3:00:03 } +2024-07-30 03:07:45,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1732/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.385587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:45,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65566 samples/s/p 3:00:11 } +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1734/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.383927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65607 samples/s/p 3:00:07 } +2024-07-30 03:07:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1736/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.382265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66024 samples/s/p 2:59:56 } +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1738/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.380601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65689 samples/s/p 3:00:00 } +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1740/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.378934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65967 samples/s/p 2:59:52 } +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1742/ 3125], loss: 0.164, per_step_time: 1415ms, lr: 9.377265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65335 samples/s/p 3:00:01 } +2024-07-30 03:08:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1744/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.375594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66241 samples/s/p 2:59:41 } +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1746/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 9.373922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66247 samples/s/p 2:59:38 } +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1748/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.3722465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65665 samples/s/p 2:59:46 } +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1750/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.3705685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66137 samples/s/p 2:59:34 } +2024-07-30 03:08:13,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1752/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.3688905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:13,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66074 samples/s/p 2:59:33 } +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1754/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.367209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66058 samples/s/p 2:59:30 } +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1756/ 3125], loss: 0.423, per_step_time: 1413ms, lr: 9.365525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.65787 samples/s/p 2:59:32 } +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1758/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.363841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66043 samples/s/p 2:59:25 } +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1760/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.362153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:24,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66067 samples/s/p 2:59:21 } +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1762/ 3125], loss: 0.590, per_step_time: 1413ms, lr: 9.360463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66137 samples/s/p 2:59:17 } +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1764/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.358771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65823 samples/s/p 2:59:20 } +2024-07-30 03:08:33,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.357077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:33,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66074 samples/s/p 2:59:13 } +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1768/ 3125], loss: 0.256, per_step_time: 1417ms, lr: 9.355382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:36,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.64216 samples/s/p 2:59:45 } +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1770/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 9.353684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66250 samples/s/p 2:59:04 } +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1772/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 9.351984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:41,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66085 samples/s/p 2:59:04 } +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1774/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.350281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66027 samples/s/p 2:59:02 } +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1776/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 9.348578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66169 samples/s/p 2:58:57 } +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1778/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.346872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66102 samples/s/p 2:58:55 } +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1780/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.345163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66137 samples/s/p 2:58:52 } +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1782/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.343452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66104 samples/s/p 2:58:50 } +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1784/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 9.341739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65927 samples/s/p 2:58:50 } +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1786/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 9.340025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65521 samples/s/p 2:58:55 } +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1788/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 9.338309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65754 samples/s/p 2:58:48 } +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1790/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.33659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65933 samples/s/p 2:58:42 } +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1792/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 9.334869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:10,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65694 samples/s/p 2:58:43 } +2024-07-30 03:09:12,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1794/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 9.333146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:12,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65867 samples/s/p 2:58:37 } +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1796/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.331422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65622 samples/s/p 2:58:39 } +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1798/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 9.329694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65829 samples/s/p 2:58:32 } +2024-07-30 03:09:21,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1800/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.327966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:21,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65782 samples/s/p 2:58:30 } +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1802/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.326234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65632 samples/s/p 2:58:30 } +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1804/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.324502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.66098 samples/s/p 2:58:19 } +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1806/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.322765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65964 samples/s/p 2:58:18 } +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1808/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 9.321029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65771 samples/s/p 2:58:19 } +2024-07-30 03:09:35,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1810/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.319289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:35,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65984 samples/s/p 2:58:12 } +2024-07-30 03:09:38,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1812/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.317549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:38,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65940 samples/s/p 2:58:10 } +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1814/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 9.315804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.66208 samples/s/p 2:58:03 } +2024-07-30 03:09:44,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1816/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.314059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:44,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66041 samples/s/p 2:58:03 } +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1818/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.312312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.65803 samples/s/p 2:58:04 } +2024-07-30 03:09:49,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1820/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 9.310561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:49,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66083 samples/s/p 2:57:56 } +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1822/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.30881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66012 samples/s/p 2:57:55 } +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1824/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.307057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:55,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66090 samples/s/p 2:57:51 } +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1826/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.3053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:58,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65938 samples/s/p 2:57:51 } +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1828/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 9.303542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66082 samples/s/p 2:57:45 } +2024-07-30 03:10:03,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1830/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.3017825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:03,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66077 samples/s/p 2:57:42 } +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1832/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 9.300021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65509 samples/s/p 2:57:50 } +2024-07-30 03:10:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1834/ 3125], loss: 0.279, per_step_time: 1414ms, lr: 9.298256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65676 samples/s/p 2:57:44 } +2024-07-30 03:10:12,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1836/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.296491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:12,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66094 samples/s/p 2:57:34 } +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1838/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.294722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66082 samples/s/p 2:57:31 } +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1840/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.292952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66152 samples/s/p 2:57:27 } +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1842/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.2911805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66063 samples/s/p 2:57:26 } +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1844/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.289406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:23,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66091 samples/s/p 2:57:22 } +2024-07-30 03:10:26,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1846/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.28763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:26,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65917 samples/s/p 2:57:23 } +2024-07-30 03:10:29,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1848/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.285851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:29,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65955 samples/s/p 2:57:19 } +2024-07-30 03:10:32,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1850/ 3125], loss: 0.507, per_step_time: 1413ms, lr: 9.28407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:32,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65889 samples/s/p 2:57:18 } +2024-07-30 03:10:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1852/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.282288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:35,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65566 samples/s/p 2:57:21 } +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1854/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.280503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65829 samples/s/p 2:57:13 } +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1856/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.278717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:40,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66109 samples/s/p 2:57:05 } +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1858/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.276928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65816 samples/s/p 2:57:08 } +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1860/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 9.275138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65901 samples/s/p 2:57:03 } +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1862/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.273345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66125 samples/s/p 2:56:56 } +2024-07-30 03:10:52,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1864/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.271551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:52,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66048 samples/s/p 2:56:55 } +2024-07-30 03:10:54,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1866/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.269754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:54,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65996 samples/s/p 2:56:53 } +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1868/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 9.267955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65444 samples/s/p 2:57:01 } +2024-07-30 03:11:00,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1870/ 3125], loss: 0.165, per_step_time: 1412ms, lr: 9.266154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:00,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66187 samples/s/p 2:56:44 } +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1872/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.264351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65815 samples/s/p 2:56:48 } +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1874/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 9.262546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65538 samples/s/p 2:56:50 } +2024-07-30 03:11:09,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1876/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.260739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:09,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65851 samples/s/p 2:56:42 } +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1878/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 9.258931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65439 samples/s/p 2:56:46 } +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1880/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.257119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.66121 samples/s/p 2:56:31 } +2024-07-30 03:11:17,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1882/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.255306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:17,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65699 samples/s/p 2:56:36 } +2024-07-30 03:11:20,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1884/ 3125], loss: 0.320, per_step_time: 1415ms, lr: 9.253491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:20,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65265 samples/s/p 2:56:41 } +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1886/ 3125], loss: 0.366, per_step_time: 1424ms, lr: 9.251674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.61561 samples/s/p 2:57:48 } +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1888/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65620 samples/s/p 2:56:29 } +2024-07-30 03:11:29,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1890/ 3125], loss: 0.278, per_step_time: 1412ms, lr: 9.248033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66175 samples/s/p 2:56:16 } +2024-07-30 03:11:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1892/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.24621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:31,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65984 samples/s/p 2:56:16 } +2024-07-30 03:11:34,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1894/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.244384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66106 samples/s/p 2:56:11 } +2024-07-30 03:11:37,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1896/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 9.242558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:37,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65951 samples/s/p 2:56:11 } +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1898/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.240728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65787 samples/s/p 2:56:12 } +2024-07-30 03:11:43,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1900/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.238896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66084 samples/s/p 2:56:03 } +2024-07-30 03:11:46,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1902/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.237063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:46,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65916 samples/s/p 2:56:04 } +2024-07-30 03:11:48,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1904/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.235228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:48,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66033 samples/s/p 2:55:59 } +2024-07-30 03:11:51,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1906/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.233391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66111 samples/s/p 2:55:54 } +2024-07-30 03:11:54,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1908/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 9.231551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:54,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66139 samples/s/p 2:55:51 } +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1910/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 9.22971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66076 samples/s/p 2:55:49 } +2024-07-30 03:12:00,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1912/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 9.227867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:00,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66065 samples/s/p 2:55:47 } +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1914/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.226022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66017 samples/s/p 2:55:45 } +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1916/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.2241735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66215 samples/s/p 2:55:38 } +2024-07-30 03:12:08,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1918/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.222324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66019 samples/s/p 2:55:39 } +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1920/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 9.220473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:11,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65990 samples/s/p 2:55:37 } +2024-07-30 03:12:14,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1922/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.218618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:14,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65994 samples/s/p 2:55:34 } +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1924/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 9.216764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66120 samples/s/p 2:55:29 } +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1926/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.214905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66076 samples/s/p 2:55:27 } +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1928/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.213046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65816 samples/s/p 2:55:29 } +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1930/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.211185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66137 samples/s/p 2:55:20 } +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1932/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 9.209321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65467 samples/s/p 2:55:30 } +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1934/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 9.207456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65962 samples/s/p 2:55:18 } +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1936/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.205588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65927 samples/s/p 2:55:15 } +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1938/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.203719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66016 samples/s/p 2:55:11 } +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1940/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 9.201847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65530 samples/s/p 2:55:17 } +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1942/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.199974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65682 samples/s/p 2:55:11 } +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1944/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.198097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66117 samples/s/p 2:55:01 } +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1946/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.19622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65787 samples/s/p 2:55:04 } +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1948/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.19434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65901 samples/s/p 2:54:59 } +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1950/ 3125], loss: 0.079, per_step_time: 1413ms, lr: 9.192459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65887 samples/s/p 2:54:56 } +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1952/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 9.190576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65574 samples/s/p 2:54:59 } +2024-07-30 03:12:59,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1954/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.18869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:59,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65847 samples/s/p 2:54:51 } +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1956/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.186801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65971 samples/s/p 2:54:46 } +2024-07-30 03:13:05,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1958/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.184912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:05,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66317 samples/s/p 2:54:37 } +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1960/ 3125], loss: 0.174, per_step_time: 1412ms, lr: 9.183021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66216 samples/s/p 2:54:36 } +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1962/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 9.181127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65679 samples/s/p 2:54:43 } +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1964/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.179231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65996 samples/s/p 2:54:34 } +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1966/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.1773345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:16,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66094 samples/s/p 2:54:30 } +2024-07-30 03:13:19,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1968/ 3125], loss: 0.075, per_step_time: 1413ms, lr: 9.175434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:19,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.65928 samples/s/p 2:54:30 } +2024-07-30 03:13:22,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1970/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.173533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:22,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66077 samples/s/p 2:54:25 } +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1972/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 9.171628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66108 samples/s/p 2:54:21 } +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1974/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.169723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66047 samples/s/p 2:54:19 } +2024-07-30 03:13:30,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1976/ 3125], loss: 0.135, per_step_time: 1412ms, lr: 9.167815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:30,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66195 samples/s/p 2:54:14 } +2024-07-30 03:13:33,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1978/ 3125], loss: 0.148, per_step_time: 1414ms, lr: 9.165906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:33,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65608 samples/s/p 2:54:22 } +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1980/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.163994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66040 samples/s/p 2:54:11 } +2024-07-30 03:13:39,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1982/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.1620805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:39,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65801 samples/s/p 2:54:13 } +2024-07-30 03:13:42,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1984/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.160166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:42,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66166 samples/s/p 2:54:03 } +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1986/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.158248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66102 samples/s/p 2:54:01 } +2024-07-30 03:13:47,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1988/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.156328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:47,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66032 samples/s/p 2:54:00 } +2024-07-30 03:13:50,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1990/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 9.154406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:50,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66124 samples/s/p 2:53:55 } +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1992/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.1524835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66069 samples/s/p 2:53:54 } +2024-07-30 03:13:56,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1994/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:56,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66089 samples/s/p 2:53:50 } +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1996/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 9.14863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66171 samples/s/p 2:53:46 } +2024-07-30 03:14:02,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1998/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.1467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:02,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66077 samples/s/p 2:53:45 } +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2000/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.144769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66024 samples/s/p 2:53:43 } +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2002/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.1428365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65832 samples/s/p 2:53:44 } +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2004/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.140901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65989 samples/s/p 2:53:38 } +2024-07-30 03:14:13,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2006/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 9.138963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:13,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.66215 samples/s/p 2:53:31 } +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2008/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.137024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65233 samples/s/p 2:53:46 } +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2010/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.135083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65884 samples/s/p 2:53:32 } +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2012/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.1331385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66144 samples/s/p 2:53:24 } +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2014/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 9.131193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65564 samples/s/p 2:53:32 } +2024-07-30 03:14:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2016/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.129246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:27,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65813 samples/s/p 2:53:24 } +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2018/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.127297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65608 samples/s/p 2:53:25 } +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2020/ 3125], loss: 0.444, per_step_time: 1412ms, lr: 9.125346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66197 samples/s/p 2:53:12 } +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2022/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.123393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65939 samples/s/p 2:53:14 } +2024-07-30 03:14:38,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2024/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.121438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:38,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65613 samples/s/p 2:53:17 } +2024-07-30 03:14:41,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2026/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.119481e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:41,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65736 samples/s/p 2:53:12 } +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2028/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.117522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65815 samples/s/p 2:53:07 } +2024-07-30 03:14:47,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2030/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 9.11556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:47,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66088 samples/s/p 2:53:00 } +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2032/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.113598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65822 samples/s/p 2:53:02 } +2024-07-30 03:14:53,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2034/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.1116335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65846 samples/s/p 2:52:58 } +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2036/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.109666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66002 samples/s/p 2:52:53 } +2024-07-30 03:14:58,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2038/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 9.107697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:58,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65769 samples/s/p 2:52:54 } +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2040/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 9.105726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65556 samples/s/p 2:52:55 } +2024-07-30 03:15:04,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2042/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.103754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:04,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66092 samples/s/p 2:52:42 } +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2044/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.101778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65950 samples/s/p 2:52:42 } +2024-07-30 03:15:10,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2046/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.099802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66159 samples/s/p 2:52:36 } +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2048/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 9.097823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66121 samples/s/p 2:52:33 } +2024-07-30 03:15:15,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2050/ 3125], loss: 0.395, per_step_time: 1412ms, lr: 9.095843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:15,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66174 samples/s/p 2:52:30 } +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2052/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.09386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.65817 samples/s/p 2:52:33 } +2024-07-30 03:15:21,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2054/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 9.091876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:21,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66135 samples/s/p 2:52:25 } +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2056/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.089889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66012 samples/s/p 2:52:24 } +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2058/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.0879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66076 samples/s/p 2:52:20 } +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2060/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 9.08591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.65877 samples/s/p 2:52:21 } +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2062/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.0839185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66121 samples/s/p 2:52:14 } +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2064/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 9.081924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:35,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65512 samples/s/p 2:52:22 } +2024-07-30 03:15:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2066/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.079927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65900 samples/s/p 2:52:12 } +2024-07-30 03:15:41,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2068/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.0779295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:41,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65688 samples/s/p 2:52:13 } +2024-07-30 03:15:44,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2070/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.0759295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66142 samples/s/p 2:52:02 } +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 9.073927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65826 samples/s/p 2:52:05 } +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2074/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 9.071923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65412 samples/s/p 2:52:10 } +2024-07-30 03:15:52,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2076/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.069917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:52,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66007 samples/s/p 2:51:56 } +2024-07-30 03:15:55,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2078/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.06791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:55,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66159 samples/s/p 2:51:50 } +2024-07-30 03:15:58,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2080/ 3125], loss: 0.248, per_step_time: 1412ms, lr: 9.0659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:58,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66204 samples/s/p 2:51:47 } +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2082/ 3125], loss: 0.082, per_step_time: 1414ms, lr: 9.063888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65645 samples/s/p 2:51:54 } +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2084/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.061873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65910 samples/s/p 2:51:46 } +2024-07-30 03:16:06,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2086/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.059858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:06,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66051 samples/s/p 2:51:41 } +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2088/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.0578405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65858 samples/s/p 2:51:42 } +2024-07-30 03:16:12,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2090/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0558215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:12,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66166 samples/s/p 2:51:33 } +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2092/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.0538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65986 samples/s/p 2:51:34 } +2024-07-30 03:16:18,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2094/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 9.051776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:18,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66099 samples/s/p 2:51:29 } +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2096/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.049751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66062 samples/s/p 2:51:27 } +2024-07-30 03:16:23,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2098/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 9.047724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:23,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65553 samples/s/p 2:51:33 } +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2100/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.045693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65914 samples/s/p 2:51:24 } +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2102/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.043662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66045 samples/s/p 2:51:19 } +2024-07-30 03:16:32,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2104/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 9.04163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:32,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65485 samples/s/p 2:51:26 } +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2106/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 9.039595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66187 samples/s/p 2:51:10 } +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2108/ 3125], loss: 0.154, per_step_time: 1414ms, lr: 9.037558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65569 samples/s/p 2:51:19 } +2024-07-30 03:16:40,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2110/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 9.035519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:40,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66254 samples/s/p 2:51:03 } +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2112/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.033478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65788 samples/s/p 2:51:09 } +2024-07-30 03:16:46,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2114/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.031435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:46,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65823 samples/s/p 2:51:06 } +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2116/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 9.029391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66240 samples/s/p 2:50:55 } +2024-07-30 03:16:52,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2118/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.027343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:52,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66194 samples/s/p 2:50:53 } +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2120/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.025296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66087 samples/s/p 2:50:52 } +2024-07-30 03:16:57,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2122/ 3125], loss: 0.121, per_step_time: 1412ms, lr: 9.023245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:57,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66207 samples/s/p 2:50:47 } +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2124/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 9.021193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65857 samples/s/p 2:50:51 } +2024-07-30 03:17:03,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2126/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 9.019139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:03,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66179 samples/s/p 2:50:42 } +2024-07-30 03:17:06,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2128/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.017082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:06,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65947 samples/s/p 2:50:44 } +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2130/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.015024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66240 samples/s/p 2:50:35 } +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2132/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 9.012964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65923 samples/s/p 2:50:38 } +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2134/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 9.010902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65768 samples/s/p 2:50:38 } +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2136/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.008838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:17,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66043 samples/s/p 2:50:31 } +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2138/ 3125], loss: 0.397, per_step_time: 1412ms, lr: 9.006773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66231 samples/s/p 2:50:24 } +2024-07-30 03:17:23,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2140/ 3125], loss: 0.387, per_step_time: 1415ms, lr: 9.004705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:23,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65071 samples/s/p 2:50:42 } +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2142/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.002635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66139 samples/s/p 2:50:20 } +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2144/ 3125], loss: 0.336, per_step_time: 1415ms, lr: 9.000564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.65347 samples/s/p 2:50:32 } +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2146/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 8.998491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66128 samples/s/p 2:50:15 } +2024-07-30 03:17:34,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2148/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 8.996415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:34,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66086 samples/s/p 2:50:13 } +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2150/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 8.994339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66073 samples/s/p 2:50:10 } +2024-07-30 03:17:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2152/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.992258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:40,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66092 samples/s/p 2:50:07 } +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2154/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 8.990178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66201 samples/s/p 2:50:02 } +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2156/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.988095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65879 samples/s/p 2:50:05 } +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2158/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 8.9860105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65975 samples/s/p 2:50:01 } +2024-07-30 03:17:51,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2160/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 8.983923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:51,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66229 samples/s/p 2:49:53 } +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2162/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.981835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65987 samples/s/p 2:49:55 } +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2164/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 8.979744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65575 samples/s/p 2:49:59 } +2024-07-30 03:18:00,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2166/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 8.977651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:00,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66069 samples/s/p 2:49:48 } +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2168/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.975558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65880 samples/s/p 2:49:48 } +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2170/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 8.973461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66019 samples/s/p 2:49:43 } +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2172/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 8.971362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65913 samples/s/p 2:49:42 } +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2174/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 8.969263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65904 samples/s/p 2:49:39 } +2024-07-30 03:18:14,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2176/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 8.967161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:14,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65490 samples/s/p 2:49:44 } +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2178/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 8.9650575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65658 samples/s/p 2:49:38 } +2024-07-30 03:18:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2180/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 8.962952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65781 samples/s/p 2:49:33 } +2024-07-30 03:18:22,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2182/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 8.960844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:22,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65919 samples/s/p 2:49:28 } +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2184/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.958734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65771 samples/s/p 2:49:28 } +2024-07-30 03:18:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2186/ 3125], loss: 0.458, per_step_time: 1414ms, lr: 8.956623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65677 samples/s/p 2:49:26 } +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2188/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.954509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65628 samples/s/p 2:49:24 } +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2190/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.952395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66099 samples/s/p 2:49:13 } +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2192/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 8.950277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65986 samples/s/p 2:49:12 } +2024-07-30 03:18:39,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2194/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 8.948158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:39,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66181 samples/s/p 2:49:06 } +2024-07-30 03:18:42,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2196/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.946038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:42,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65963 samples/s/p 2:49:07 } +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2198/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.943915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65966 samples/s/p 2:49:04 } +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2200/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 8.94179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66164 samples/s/p 2:48:58 } +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2202/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 8.939664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66095 samples/s/p 2:48:56 } +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2204/ 3125], loss: 0.249, per_step_time: 1415ms, lr: 8.937535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.65116 samples/s/p 2:49:11 } +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 8.935404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66200 samples/s/p 2:48:49 } +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2208/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.9332725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65916 samples/s/p 2:48:51 } +2024-07-30 03:19:02,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2210/ 3125], loss: 0.392, per_step_time: 1412ms, lr: 8.931139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:02,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66403 samples/s/p 2:48:40 } +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2212/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.929003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65841 samples/s/p 2:48:47 } +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2214/ 3125], loss: 0.446, per_step_time: 1415ms, lr: 8.926866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.64990 samples/s/p 2:48:59 } +2024-07-30 03:19:10,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2216/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.924726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:10,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65967 samples/s/p 2:48:39 } +2024-07-30 03:19:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2218/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 8.922584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66171 samples/s/p 2:48:32 } +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2220/ 3125], loss: 0.357, per_step_time: 1425ms, lr: 8.92044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.61291 samples/s/p 2:49:57 } +2024-07-30 03:19:19,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2222/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.918296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:19,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66109 samples/s/p 2:48:28 } +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2224/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.916148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66069 samples/s/p 2:48:26 } +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2226/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 8.913999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66206 samples/s/p 2:48:20 } +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2228/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.911848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66095 samples/s/p 2:48:20 } +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2230/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.909696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65965 samples/s/p 2:48:19 } +2024-07-30 03:19:33,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2232/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.907542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:33,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65880 samples/s/p 2:48:18 } +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2234/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.905385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65795 samples/s/p 2:48:16 } +2024-07-30 03:19:39,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2236/ 3125], loss: 0.187, per_step_time: 1416ms, lr: 8.903226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:39,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.64644 samples/s/p 2:48:34 } +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2238/ 3125], loss: 0.119, per_step_time: 1414ms, lr: 8.901066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65673 samples/s/p 2:48:13 } +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2240/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.8989045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65934 samples/s/p 2:48:05 } +2024-07-30 03:19:47,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2242/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.896741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66017 samples/s/p 2:48:01 } +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2244/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.894574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66024 samples/s/p 2:47:58 } +2024-07-30 03:19:53,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2246/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.892407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66066 samples/s/p 2:47:55 } +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2248/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.890238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:56,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.65999 samples/s/p 2:47:53 } +2024-07-30 03:19:59,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2250/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.888067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:59,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66059 samples/s/p 2:47:49 } +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2252/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.885892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66080 samples/s/p 2:47:46 } +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2254/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.883718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66081 samples/s/p 2:47:43 } +2024-07-30 03:20:07,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2256/ 3125], loss: 0.274, per_step_time: 1415ms, lr: 8.881541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:07,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65355 samples/s/p 2:47:53 } +2024-07-30 03:20:10,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2258/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 8.879362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:10,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65757 samples/s/p 2:47:43 } +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2260/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.877181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66017 samples/s/p 2:47:36 } +2024-07-30 03:20:16,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2262/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.874999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:16,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66045 samples/s/p 2:47:32 } +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2264/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.872815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65711 samples/s/p 2:47:36 } +2024-07-30 03:20:21,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2266/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.870629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:21,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66017 samples/s/p 2:47:27 } +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2268/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.86844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66048 samples/s/p 2:47:24 } +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2270/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.86625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66115 samples/s/p 2:47:20 } +2024-07-30 03:20:30,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2272/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.864059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:30,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.65782 samples/s/p 2:47:23 } +2024-07-30 03:20:33,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2274/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.861865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:33,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66154 samples/s/p 2:47:14 } +2024-07-30 03:20:36,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2276/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.85967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65880 samples/s/p 2:47:16 } +2024-07-30 03:20:38,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2278/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 8.8574725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:38,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66008 samples/s/p 2:47:10 } +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2280/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.855273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65824 samples/s/p 2:47:11 } +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2282/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.853073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66095 samples/s/p 2:47:03 } +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2284/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 8.85087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:47,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65426 samples/s/p 2:47:12 } +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2286/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 8.848665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65666 samples/s/p 2:47:05 } +2024-07-30 03:20:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2288/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.8464585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:53,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66102 samples/s/p 2:46:55 } +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2290/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.84425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66154 samples/s/p 2:46:51 } +2024-07-30 03:20:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2292/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 8.842041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:58,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65866 samples/s/p 2:46:53 } +2024-07-30 03:21:01,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2294/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 8.839828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:01,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65708 samples/s/p 2:46:53 } +2024-07-30 03:21:04,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2296/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 8.837615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:04,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65754 samples/s/p 2:46:50 } +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2298/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 8.835399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65490 samples/s/p 2:46:51 } +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2300/ 3125], loss: 0.378, per_step_time: 1415ms, lr: 8.833182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65273 samples/s/p 2:46:52 } +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2302/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 8.8309625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65857 samples/s/p 2:46:39 } +2024-07-30 03:21:15,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2304/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.828741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65971 samples/s/p 2:46:34 } +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2306/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 8.826519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65772 samples/s/p 2:46:35 } +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2308/ 3125], loss: 0.211, per_step_time: 1415ms, lr: 8.824293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:21,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65279 samples/s/p 2:46:41 } +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2310/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 8.822068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.66204 samples/s/p 2:46:22 } +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2312/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 8.8198385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.65927 samples/s/p 2:46:24 } +2024-07-30 03:21:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2314/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 8.817608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66191 samples/s/p 2:46:16 } +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2316/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 8.8153765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66207 samples/s/p 2:46:13 } +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2318/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 8.813143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66092 samples/s/p 2:46:12 } +2024-07-30 03:21:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2320/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.810907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:38,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66258 samples/s/p 2:46:07 } +2024-07-30 03:21:41,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2322/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 8.808669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66133 samples/s/p 2:46:06 } +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2324/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.80643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.65972 samples/s/p 2:46:06 } +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2326/ 3125], loss: 0.665, per_step_time: 1413ms, lr: 8.804189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66040 samples/s/p 2:46:02 } +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2328/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.801945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.65885 samples/s/p 2:46:02 } +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2330/ 3125], loss: 0.517, per_step_time: 1413ms, lr: 8.7997005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:52,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65884 samples/s/p 2:45:59 } +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2332/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.797455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66003 samples/s/p 2:45:54 } +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2334/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 8.795207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66033 samples/s/p 2:45:51 } +2024-07-30 03:22:01,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2336/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 8.792956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:01,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65986 samples/s/p 2:45:49 } +2024-07-30 03:22:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2338/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.790704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:03,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65977 samples/s/p 2:45:46 } +2024-07-30 03:22:06,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2340/ 3125], loss: 0.059, per_step_time: 1412ms, lr: 8.788449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:06,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66189 samples/s/p 2:45:40 } +2024-07-30 03:22:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2342/ 3125], loss: 0.110, per_step_time: 1412ms, lr: 8.7861945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66172 samples/s/p 2:45:37 } +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2344/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.783937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:12,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66157 samples/s/p 2:45:35 } +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2346/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.781677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:15,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66133 samples/s/p 2:45:32 } +2024-07-30 03:22:18,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2348/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 8.779416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:18,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.65863 samples/s/p 2:45:34 } +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2350/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 8.777153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65851 samples/s/p 2:45:31 } +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2352/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 8.774889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.66125 samples/s/p 2:45:24 } +2024-07-30 03:22:26,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2354/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.772622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65873 samples/s/p 2:45:25 } +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2356/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.770355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65681 samples/s/p 2:45:26 } +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2358/ 3125], loss: 0.312, per_step_time: 1415ms, lr: 8.768084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65293 samples/s/p 2:45:30 } +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2360/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 8.765812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66123 samples/s/p 2:45:13 } +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2362/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.763538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:37,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65830 samples/s/p 2:45:15 } +2024-07-30 03:22:40,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2364/ 3125], loss: 0.183, per_step_time: 1419ms, lr: 8.7612625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:40,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.63732 samples/s/p 2:45:49 } +2024-07-30 03:22:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2366/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 8.758985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66098 samples/s/p 2:45:04 } +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2368/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.756707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65841 samples/s/p 2:45:06 } +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2370/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 8.754426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65977 samples/s/p 2:45:01 } +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2372/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.752143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65586 samples/s/p 2:45:05 } +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2374/ 3125], loss: 0.473, per_step_time: 1417ms, lr: 8.749858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.64314 samples/s/p 2:45:24 } +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2376/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.747572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.66027 samples/s/p 2:44:52 } +2024-07-30 03:23:00,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2378/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 8.745284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:00,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65831 samples/s/p 2:44:52 } +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2380/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.7429935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65780 samples/s/p 2:44:50 } +2024-07-30 03:23:06,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2382/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 8.7407025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:06,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66319 samples/s/p 2:44:38 } +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2384/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.738409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66000 samples/s/p 2:44:41 } +2024-07-30 03:23:11,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2386/ 3125], loss: 0.167, per_step_time: 1412ms, lr: 8.736114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:11,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66307 samples/s/p 2:44:33 } +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2388/ 3125], loss: 0.389, per_step_time: 1412ms, lr: 8.733817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66188 samples/s/p 2:44:32 } +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2390/ 3125], loss: 0.474, per_step_time: 1412ms, lr: 8.731518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66184 samples/s/p 2:44:29 } +2024-07-30 03:23:20,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2392/ 3125], loss: 0.226, per_step_time: 1412ms, lr: 8.729217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:20,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66242 samples/s/p 2:44:25 } +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2394/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 8.726915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66073 samples/s/p 2:44:25 } +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2396/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.724612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:26,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65923 samples/s/p 2:44:25 } +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2398/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 8.722305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66072 samples/s/p 2:44:20 } +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2400/ 3125], loss: 0.117, per_step_time: 1414ms, lr: 8.719997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65739 samples/s/p 2:44:23 } +2024-07-30 03:23:34,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2402/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.717688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:34,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66033 samples/s/p 2:44:15 } +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2404/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.715378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65984 samples/s/p 2:44:13 } +2024-07-30 03:23:40,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2406/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 8.713065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:40,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66108 samples/s/p 2:44:08 } +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2408/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 8.710749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.65097 samples/s/p 2:44:23 } +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2410/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 8.708433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66276 samples/s/p 2:43:59 } +2024-07-30 03:23:48,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2412/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.706115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:48,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66035 samples/s/p 2:44:01 } +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2414/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 8.703795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66206 samples/s/p 2:43:55 } +2024-07-30 03:23:54,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2416/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.701472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:54,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66049 samples/s/p 2:43:55 } +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2418/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.699149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66123 samples/s/p 2:43:51 } +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2420/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 8.696824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65944 samples/s/p 2:43:51 } +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2422/ 3125], loss: 0.210, per_step_time: 1414ms, lr: 8.694497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65424 samples/s/p 2:43:57 } +2024-07-30 03:24:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2424/ 3125], loss: 0.583, per_step_time: 1413ms, lr: 8.692168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:05,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65839 samples/s/p 2:43:47 } +2024-07-30 03:24:08,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2426/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.689837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:08,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65963 samples/s/p 2:43:42 } +2024-07-30 03:24:11,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2428/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 8.687505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:11,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66082 samples/s/p 2:43:37 } +2024-07-30 03:24:14,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2430/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 8.6851705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:14,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66228 samples/s/p 2:43:32 } +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2432/ 3125], loss: 0.409, per_step_time: 1415ms, lr: 8.682835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65323 samples/s/p 2:43:45 } +2024-07-30 03:24:19,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2434/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 8.680497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:19,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.66204 samples/s/p 2:43:27 } +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2436/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 8.678157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.65969 samples/s/p 2:43:28 } +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2438/ 3125], loss: 0.460, per_step_time: 1414ms, lr: 8.675816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65598 samples/s/p 2:43:31 } +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2440/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 8.6734735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65945 samples/s/p 2:43:23 } +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2442/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 8.671129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65765 samples/s/p 2:43:23 } +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2444/ 3125], loss: 0.472, per_step_time: 1413ms, lr: 8.668782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66110 samples/s/p 2:43:14 } +2024-07-30 03:24:36,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2446/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.666434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65853 samples/s/p 2:43:16 } +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2448/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 8.664085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65996 samples/s/p 2:43:10 } +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2450/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.661733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66066 samples/s/p 2:43:06 } +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2452/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.659379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65952 samples/s/p 2:43:05 } +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2454/ 3125], loss: 0.155, per_step_time: 1414ms, lr: 8.6570235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65541 samples/s/p 2:43:10 } +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2456/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 8.654667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:51,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66129 samples/s/p 2:42:57 } +2024-07-30 03:24:53,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2458/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.652309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65918 samples/s/p 2:42:58 } +2024-07-30 03:24:56,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2460/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 8.649948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66085 samples/s/p 2:42:52 } +2024-07-30 03:24:59,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2462/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.647586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:59,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66036 samples/s/p 2:42:50 } +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2464/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.645222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66097 samples/s/p 2:42:46 } +2024-07-30 03:25:05,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2466/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 8.642855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:05,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66268 samples/s/p 2:42:40 } +2024-07-30 03:25:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2468/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.640488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65828 samples/s/p 2:42:45 } +2024-07-30 03:25:10,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2470/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 8.638119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:10,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65787 samples/s/p 2:42:43 } +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2472/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 8.635749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65691 samples/s/p 2:42:42 } +2024-07-30 03:25:16,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2474/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.633376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65959 samples/s/p 2:42:34 } +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2476/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 8.631002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65513 samples/s/p 2:42:39 } +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2478/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.628625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65768 samples/s/p 2:42:32 } +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2480/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.626247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65961 samples/s/p 2:42:26 } +2024-07-30 03:25:27,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2482/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 8.623868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:27,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66126 samples/s/p 2:42:20 } +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2484/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 8.621487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66190 samples/s/p 2:42:16 } +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2486/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 8.619103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66195 samples/s/p 2:42:13 } +2024-07-30 03:25:36,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2488/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.616719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:36,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65806 samples/s/p 2:42:17 } +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2490/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 8.614333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.66187 samples/s/p 2:42:08 } +2024-07-30 03:25:42,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2492/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 8.611944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:42,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65858 samples/s/p 2:42:11 } +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2494/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:44,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65981 samples/s/p 2:42:06 } +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2496/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 8.607162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65962 samples/s/p 2:42:03 } +2024-07-30 03:25:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2498/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.6047685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65907 samples/s/p 2:42:01 } +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2500/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.602375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66055 samples/s/p 2:41:56 } +2024-07-30 03:25:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2502/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 8.599976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:56,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65590 samples/s/p 2:42:01 } +2024-07-30 03:25:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2504/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 8.597579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65699 samples/s/p 2:41:56 } +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2506/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.595178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66079 samples/s/p 2:41:47 } +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2508/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 8.592777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66075 samples/s/p 2:41:44 } +2024-07-30 03:26:07,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2510/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 8.590373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66082 samples/s/p 2:41:41 } +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2512/ 3125], loss: 0.230, per_step_time: 1416ms, lr: 8.587968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.64776 samples/s/p 2:42:01 } +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2514/ 3125], loss: 0.258, per_step_time: 1415ms, lr: 8.58556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.65341 samples/s/p 2:41:48 } +2024-07-30 03:26:16,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2516/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 8.5831525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:16,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66023 samples/s/p 2:41:34 } +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2518/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.580741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65703 samples/s/p 2:41:36 } +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2520/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.578329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65976 samples/s/p 2:41:29 } +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2522/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.575915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:24,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65982 samples/s/p 2:41:26 } +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2524/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.573499e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66018 samples/s/p 2:41:23 } +2024-07-30 03:26:30,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2526/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 8.571082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66202 samples/s/p 2:41:17 } +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2528/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 8.568663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65661 samples/s/p 2:41:23 } +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2530/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.566242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65924 samples/s/p 2:41:16 } +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2532/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 8.563819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:38,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65887 samples/s/p 2:41:14 } +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2534/ 3125], loss: 0.080, per_step_time: 1412ms, lr: 8.561396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.66232 samples/s/p 2:41:05 } +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2536/ 3125], loss: 0.029, per_step_time: 1412ms, lr: 8.55897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66202 samples/s/p 2:41:02 } +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2538/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 8.556542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66080 samples/s/p 2:41:02 } +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2540/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 8.554112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.65995 samples/s/p 2:41:00 } +2024-07-30 03:26:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2542/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.551682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:52,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.65997 samples/s/p 2:40:58 } +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2544/ 3125], loss: 0.513, per_step_time: 1412ms, lr: 8.549249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66238 samples/s/p 2:40:51 } +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2546/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 8.546815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66077 samples/s/p 2:40:50 } +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2548/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 8.544379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66062 samples/s/p 2:40:48 } +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2550/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 8.541941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65944 samples/s/p 2:40:47 } +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2552/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.539501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65926 samples/s/p 2:40:45 } +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2554/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 8.537061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66174 samples/s/p 2:40:38 } +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2556/ 3125], loss: 0.344, per_step_time: 1415ms, lr: 8.534618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65362 samples/s/p 2:40:49 } +2024-07-30 03:27:15,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2558/ 3125], loss: 0.511, per_step_time: 1414ms, lr: 8.532173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65564 samples/s/p 2:40:42 } +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2560/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 8.529727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65610 samples/s/p 2:40:39 } +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2562/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 8.5272795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65943 samples/s/p 2:40:30 } +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2564/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.52483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65907 samples/s/p 2:40:28 } +2024-07-30 03:27:26,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2566/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 8.522378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:26,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65867 samples/s/p 2:40:26 } +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2568/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.519925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66024 samples/s/p 2:40:20 } +2024-07-30 03:27:32,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2570/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.517471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:32,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66055 samples/s/p 2:40:17 } +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2572/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 8.515014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:35,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65924 samples/s/p 2:40:16 } +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2574/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.512557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65958 samples/s/p 2:40:13 } +2024-07-30 03:27:41,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2576/ 3125], loss: 0.606, per_step_time: 1414ms, lr: 8.510097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:41,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65483 samples/s/p 2:40:18 } +2024-07-30 03:27:43,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2578/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.507635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:44,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65924 samples/s/p 2:40:08 } +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2580/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 8.505172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66031 samples/s/p 2:40:03 } +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2582/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.502709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66145 samples/s/p 2:39:58 } +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2584/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 8.500242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66029 samples/s/p 2:39:58 } +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2586/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 8.497773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65717 samples/s/p 2:40:00 } +2024-07-30 03:27:58,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2588/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.495304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:58,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66030 samples/s/p 2:39:52 } +2024-07-30 03:28:01,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2590/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 8.492833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65910 samples/s/p 2:39:51 } +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2592/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.4903595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66068 samples/s/p 2:39:46 } +2024-07-30 03:28:06,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2594/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.487885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66000 samples/s/p 2:39:44 } +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2596/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.485409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66102 samples/s/p 2:39:39 } +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2598/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.482931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66081 samples/s/p 2:39:37 } +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2600/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.480451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:15,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65896 samples/s/p 2:39:37 } +2024-07-30 03:28:18,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2602/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 8.477969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:18,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65693 samples/s/p 2:39:38 } +2024-07-30 03:28:20,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2604/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.4754865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:20,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65900 samples/s/p 2:39:32 } +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2606/ 3125], loss: 0.323, per_step_time: 1424ms, lr: 8.473002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.61585 samples/s/p 2:40:42 } +2024-07-30 03:28:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2608/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 8.470515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66054 samples/s/p 2:39:23 } +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2610/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 8.468027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66254 samples/s/p 2:39:17 } +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2612/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 8.465538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65713 samples/s/p 2:39:23 } +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2614/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 8.4630465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65754 samples/s/p 2:39:20 } +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2616/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.4605535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65775 samples/s/p 2:39:17 } +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2618/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 8.45806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.66209 samples/s/p 2:39:06 } +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2620/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 8.455562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65733 samples/s/p 2:39:12 } +2024-07-30 03:28:46,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2622/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.453065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:46,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.65820 samples/s/p 2:39:07 } +2024-07-30 03:28:49,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2624/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.4505655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:49,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.66129 samples/s/p 2:38:59 } +2024-07-30 03:28:52,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2626/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.448064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:52,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.66119 samples/s/p 2:38:57 } +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2628/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 8.445561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.65584 samples/s/p 2:39:03 } +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2630/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 8.443058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66177 samples/s/p 2:38:50 } +2024-07-30 03:29:00,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2632/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.440551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65432 samples/s/p 2:39:00 } +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2634/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.438044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65997 samples/s/p 2:38:47 } +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2636/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 8.435534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66172 samples/s/p 2:38:42 } +2024-07-30 03:29:09,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2638/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 8.433022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65878 samples/s/p 2:38:44 } +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2640/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 8.43051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66281 samples/s/p 2:38:34 } +2024-07-30 03:29:14,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2642/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 8.427995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:14,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66036 samples/s/p 2:38:35 } +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2644/ 3125], loss: 0.282, per_step_time: 1416ms, lr: 8.425479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.64651 samples/s/p 2:38:56 } +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2646/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 8.422962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65800 samples/s/p 2:38:34 } +2024-07-30 03:29:23,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2648/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.420443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:23,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65908 samples/s/p 2:38:29 } +2024-07-30 03:29:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2650/ 3125], loss: 0.492, per_step_time: 1414ms, lr: 8.417922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65730 samples/s/p 2:38:29 } +2024-07-30 03:29:28,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2652/ 3125], loss: 0.169, per_step_time: 1415ms, lr: 8.4154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:28,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65059 samples/s/p 2:38:38 } +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2654/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.412875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65812 samples/s/p 2:38:22 } +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2656/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 8.410349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:34,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.66079 samples/s/p 2:38:15 } +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2658/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 8.407823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66046 samples/s/p 2:38:13 } +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2660/ 3125], loss: 0.666, per_step_time: 1413ms, lr: 8.405293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66063 samples/s/p 2:38:10 } +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2662/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 8.402762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65728 samples/s/p 2:38:12 } +2024-07-30 03:29:45,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2664/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 8.40023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65976 samples/s/p 2:38:05 } +2024-07-30 03:29:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2666/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 8.397697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65758 samples/s/p 2:38:06 } +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2668/ 3125], loss: 0.216, per_step_time: 1414ms, lr: 8.395162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65457 samples/s/p 2:38:08 } +2024-07-30 03:29:54,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2670/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.392624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:54,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65789 samples/s/p 2:38:00 } +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2672/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 8.390086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:57,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65972 samples/s/p 2:37:54 } +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2674/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.387545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66135 samples/s/p 2:37:49 } +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2676/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.385003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66143 samples/s/p 2:37:46 } +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2678/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 8.38246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.65977 samples/s/p 2:37:46 } +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2680/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 8.379913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:08,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66203 samples/s/p 2:37:39 } +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2682/ 3125], loss: 0.554, per_step_time: 1412ms, lr: 8.377367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:11,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66207 samples/s/p 2:37:36 } +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2684/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.374818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66081 samples/s/p 2:37:35 } +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2686/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 8.372269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66182 samples/s/p 2:37:31 } +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2688/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 8.369716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65967 samples/s/p 2:37:32 } +2024-07-30 03:30:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2690/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.367164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:22,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65808 samples/s/p 2:37:31 } +2024-07-30 03:30:25,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2692/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.364609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:25,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65947 samples/s/p 2:37:26 } +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2694/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.3620525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66027 samples/s/p 2:37:22 } +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2696/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 8.359494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66035 samples/s/p 2:37:19 } +2024-07-30 03:30:34,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2698/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 8.356935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:34,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65831 samples/s/p 2:37:20 } +2024-07-30 03:30:36,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2700/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 8.354374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66043 samples/s/p 2:37:13 } +2024-07-30 03:30:39,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2702/ 3125], loss: 0.419, per_step_time: 1414ms, lr: 8.351811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:39,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65753 samples/s/p 2:37:15 } +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2704/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.349247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66033 samples/s/p 2:37:08 } +2024-07-30 03:30:45,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2706/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.34668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:45,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66145 samples/s/p 2:37:03 } +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2708/ 3125], loss: 0.245, per_step_time: 1418ms, lr: 8.344113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.63904 samples/s/p 2:37:38 } +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2710/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.3415425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65931 samples/s/p 2:37:01 } +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2712/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 8.338972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65687 samples/s/p 2:37:02 } +2024-07-30 03:30:56,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2714/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 8.336399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:56,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66039 samples/s/p 2:36:54 } +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2716/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 8.3338255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65458 samples/s/p 2:37:01 } +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2718/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.33125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65688 samples/s/p 2:36:54 } +2024-07-30 03:31:05,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2720/ 3125], loss: 0.154, per_step_time: 1415ms, lr: 8.328672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:05,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65077 samples/s/p 2:37:01 } +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2722/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 8.326094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.66037 samples/s/p 2:36:42 } +2024-07-30 03:31:10,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2724/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.323513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:10,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66007 samples/s/p 2:36:40 } +2024-07-30 03:31:13,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2726/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 8.320931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:13,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66306 samples/s/p 2:36:32 } +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2728/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.318348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66018 samples/s/p 2:36:34 } +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2730/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.315763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:19,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66093 samples/s/p 2:36:30 } +2024-07-30 03:31:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2732/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.313175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66057 samples/s/p 2:36:28 } +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2734/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.310587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:25,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66202 samples/s/p 2:36:23 } +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2736/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.307998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65954 samples/s/p 2:36:24 } +2024-07-30 03:31:30,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2738/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 8.3054065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:30,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65844 samples/s/p 2:36:23 } +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2740/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 8.3028135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.64641 samples/s/p 2:36:40 } +2024-07-30 03:31:36,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2742/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.300218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:36,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65805 samples/s/p 2:36:18 } +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2744/ 3125], loss: 0.310, per_step_time: 1416ms, lr: 8.297622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.64925 samples/s/p 2:36:30 } +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2746/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.295025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65933 samples/s/p 2:36:10 } +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2748/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.292424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65892 samples/s/p 2:36:08 } +2024-07-30 03:31:47,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2750/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.289823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:47,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65845 samples/s/p 2:36:06 } +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2752/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.287221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:50,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65815 samples/s/p 2:36:04 } +2024-07-30 03:31:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2754/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.284617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:53,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66067 samples/s/p 2:35:57 } +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2756/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.282012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:56,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65820 samples/s/p 2:35:58 } +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2758/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 8.279404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66028 samples/s/p 2:35:52 } +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2760/ 3125], loss: 0.341, per_step_time: 1412ms, lr: 8.276795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66289 samples/s/p 2:35:45 } +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2762/ 3125], loss: 0.064, per_step_time: 1412ms, lr: 8.274184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66253 samples/s/p 2:35:42 } +2024-07-30 03:32:07,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2764/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 8.271573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:07,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65766 samples/s/p 2:35:48 } +2024-07-30 03:32:10,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2766/ 3125], loss: 0.188, per_step_time: 1412ms, lr: 8.26896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:10,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66172 samples/s/p 2:35:38 } +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2768/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.266344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65445 samples/s/p 2:35:47 } +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2770/ 3125], loss: 0.292, per_step_time: 1417ms, lr: 8.263728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.64530 samples/s/p 2:35:59 } +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2772/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 8.2611095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65748 samples/s/p 2:35:37 } +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2774/ 3125], loss: 0.234, per_step_time: 1416ms, lr: 8.25849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.64798 samples/s/p 2:35:49 } +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2776/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 8.255868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65862 samples/s/p 2:35:29 } +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2778/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.253245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.66010 samples/s/p 2:35:24 } +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2780/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 8.250621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66098 samples/s/p 2:35:19 } +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2782/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 8.2479955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65970 samples/s/p 2:35:19 } +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2784/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 8.245368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:35,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66091 samples/s/p 2:35:14 } +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2786/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.242739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66155 samples/s/p 2:35:10 } +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2788/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 8.240108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65838 samples/s/p 2:35:12 } +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2790/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 8.237476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66193 samples/s/p 2:35:04 } +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2792/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 8.234842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65516 samples/s/p 2:35:12 } +2024-07-30 03:32:50,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2794/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 8.2322085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65832 samples/s/p 2:35:04 } +2024-07-30 03:32:52,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2796/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 8.22957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:52,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66317 samples/s/p 2:34:53 } +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2798/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 8.226932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66083 samples/s/p 2:34:54 } +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2800/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 8.224293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65758 samples/s/p 2:34:57 } +2024-07-30 03:32:58,651 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2802/ 3125], loss: 0.252, per_step_time: 1417ms, lr: 8.221651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.64499 samples/s/p 2:35:15 } +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2804/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.219007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:36,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65879 samples/s/p 2:34:49 } +2024-07-30 03:33:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2806/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.216363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:39,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.66132 samples/s/p 2:34:42 } +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2808/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 8.213718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65728 samples/s/p 2:34:46 } +2024-07-30 03:33:44,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2810/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 8.211069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:44,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.66105 samples/s/p 2:34:37 } +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2812/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.208421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65776 samples/s/p 2:34:39 } +2024-07-30 03:33:50,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2814/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 8.20577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:50,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.66068 samples/s/p 2:34:32 } +2024-07-30 03:33:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2816/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 8.203118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:53,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.65601 samples/s/p 2:34:37 } +2024-07-30 03:33:56,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2818/ 3125], loss: 0.163, per_step_time: 1415ms, lr: 8.200464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:56,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.65081 samples/s/p 2:34:42 } +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2820/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.19781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:59,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66201 samples/s/p 2:34:21 } +2024-07-30 03:34:02,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2822/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 8.195152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:02,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66116 samples/s/p 2:34:20 } +2024-07-30 03:34:04,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2824/ 3125], loss: 0.480, per_step_time: 1412ms, lr: 8.1924945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:04,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66262 samples/s/p 2:34:15 } +2024-07-30 03:34:07,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2826/ 3125], loss: 0.451, per_step_time: 1421ms, lr: 8.189835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:07,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.62978 samples/s/p 2:35:06 } +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2828/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 8.187173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:10,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65777 samples/s/p 2:34:17 } +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2830/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.184512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.66057 samples/s/p 2:34:09 } +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2832/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.181846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:16,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65794 samples/s/p 2:34:11 } +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2834/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 8.17918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65402 samples/s/p 2:34:15 } +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2836/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.176514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66169 samples/s/p 2:33:59 } +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2838/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 8.1738435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65888 samples/s/p 2:34:01 } +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2840/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.171173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65937 samples/s/p 2:33:57 } +2024-07-30 03:34:30,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2842/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.168502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:30,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65883 samples/s/p 2:33:55 } +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2844/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 8.165828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66082 samples/s/p 2:33:49 } +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2846/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 8.163152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65455 samples/s/p 2:33:57 } +2024-07-30 03:34:38,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2848/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 8.160477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:38,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65879 samples/s/p 2:33:47 } +2024-07-30 03:34:41,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2850/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.157799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65943 samples/s/p 2:33:43 } +2024-07-30 03:34:44,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2852/ 3125], loss: 0.294, per_step_time: 1425ms, lr: 8.155119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:44,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.61188 samples/s/p 2:34:58 } +2024-07-30 03:34:47,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2854/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.152439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:47,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.66151 samples/s/p 2:33:34 } +2024-07-30 03:34:50,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.149756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66126 samples/s/p 2:33:32 } +2024-07-30 03:34:53,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2858/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.147072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:53,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66111 samples/s/p 2:33:29 } +2024-07-30 03:34:55,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2860/ 3125], loss: 0.232, per_step_time: 1415ms, lr: 8.144387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:55,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65157 samples/s/p 2:33:42 } +2024-07-30 03:34:58,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2862/ 3125], loss: 0.199, per_step_time: 1415ms, lr: 8.1417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:58,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65133 samples/s/p 2:33:39 } +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2864/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.139012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66127 samples/s/p 2:33:20 } +2024-07-30 03:35:04,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2866/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 8.1363205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:04,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.65451 samples/s/p 2:33:28 } +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2868/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 8.133629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66057 samples/s/p 2:33:16 } +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2870/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.130936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66011 samples/s/p 2:33:14 } +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2872/ 3125], loss: 0.205, per_step_time: 1417ms, lr: 8.1282415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.64517 samples/s/p 2:33:35 } +2024-07-30 03:35:16,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2874/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.125546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65832 samples/s/p 2:33:11 } +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2876/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 8.122848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65954 samples/s/p 2:33:06 } +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2878/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.12015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66025 samples/s/p 2:33:02 } +2024-07-30 03:35:24,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2880/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.117449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:24,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66001 samples/s/p 2:33:00 } +2024-07-30 03:35:27,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2882/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 8.114746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65778 samples/s/p 2:33:00 } +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2884/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.112043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65879 samples/s/p 2:32:56 } +2024-07-30 03:35:33,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2886/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 8.109339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:33,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65289 samples/s/p 2:33:03 } +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2888/ 3125], loss: 0.190, per_step_time: 1417ms, lr: 8.106633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.64431 samples/s/p 2:33:14 } +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2890/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.103924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65789 samples/s/p 2:32:49 } +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2892/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 8.101215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:41,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65644 samples/s/p 2:32:49 } +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2894/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.098505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66047 samples/s/p 2:32:39 } +2024-07-30 03:35:47,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2896/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.0957925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:47,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65733 samples/s/p 2:32:41 } +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2898/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 8.0930795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65890 samples/s/p 2:32:36 } +2024-07-30 03:35:53,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2900/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.090362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:53,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66068 samples/s/p 2:32:30 } +2024-07-30 03:35:55,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2902/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.087645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:55,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65388 samples/s/p 2:32:39 } +2024-07-30 03:35:58,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2904/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 8.084929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:58,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66107 samples/s/p 2:32:24 } +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2906/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.082207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:01,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66141 samples/s/p 2:32:21 } +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2908/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.079487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65979 samples/s/p 2:32:20 } +2024-07-30 03:36:07,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2910/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.076764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:07,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65904 samples/s/p 2:32:19 } +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2912/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 8.07404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:10,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65914 samples/s/p 2:32:16 } +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2914/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.071315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65993 samples/s/p 2:32:12 } +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2916/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 8.068589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65997 samples/s/p 2:32:09 } +2024-07-30 03:36:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2918/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 8.065859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:18,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65790 samples/s/p 2:32:09 } +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2920/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.063129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66088 samples/s/p 2:32:02 } +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2922/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.060398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66084 samples/s/p 2:31:59 } +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2924/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.057666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65535 samples/s/p 2:32:05 } +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2926/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.05493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66011 samples/s/p 2:31:55 } +2024-07-30 03:36:32,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2928/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 8.052194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65760 samples/s/p 2:31:56 } +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2930/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.049457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65620 samples/s/p 2:31:55 } +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2932/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.046719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65971 samples/s/p 2:31:47 } +2024-07-30 03:36:41,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2934/ 3125], loss: 0.144, per_step_time: 1412ms, lr: 8.043978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:41,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66223 samples/s/p 2:31:40 } +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2936/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 8.0412365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66018 samples/s/p 2:31:40 } +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2938/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.038493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65971 samples/s/p 2:31:38 } +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2940/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.035749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65451 samples/s/p 2:31:44 } +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2942/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 8.033003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:52,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65933 samples/s/p 2:31:33 } +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2944/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.030256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66078 samples/s/p 2:31:28 } +2024-07-30 03:36:58,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2946/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 8.027507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:58,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65846 samples/s/p 2:31:29 } +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2948/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.024756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66060 samples/s/p 2:31:23 } +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2950/ 3125], loss: 0.508, per_step_time: 1413ms, lr: 8.022005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65779 samples/s/p 2:31:24 } +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2952/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 8.019252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:06,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65068 samples/s/p 2:31:33 } +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2954/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.016496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66153 samples/s/p 2:31:13 } +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2956/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.013741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:12,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66054 samples/s/p 2:31:11 } +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2958/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.010983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65958 samples/s/p 2:31:10 } +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2960/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 8.008224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65979 samples/s/p 2:31:07 } +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2962/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.005464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65890 samples/s/p 2:31:06 } +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2964/ 3125], loss: 0.201, per_step_time: 1415ms, lr: 8.002702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:23,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65311 samples/s/p 2:31:12 } +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2966/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 7.999938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65985 samples/s/p 2:30:58 } +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2968/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.997174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65907 samples/s/p 2:30:57 } +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2970/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 7.9944075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65581 samples/s/p 2:30:59 } +2024-07-30 03:37:35,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2972/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 7.991641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:35,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65691 samples/s/p 2:30:55 } +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2974/ 3125], loss: 0.402, per_step_time: 1415ms, lr: 7.988871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65250 samples/s/p 2:30:59 } +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2976/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 7.986101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.66072 samples/s/p 2:30:43 } +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2978/ 3125], loss: 0.486, per_step_time: 1413ms, lr: 7.983329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65945 samples/s/p 2:30:42 } +2024-07-30 03:37:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2980/ 3125], loss: 0.218, per_step_time: 1414ms, lr: 7.980555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:46,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65627 samples/s/p 2:30:44 } +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2982/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.977781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66075 samples/s/p 2:30:34 } +2024-07-30 03:37:52,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2984/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 7.975005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:52,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65940 samples/s/p 2:30:34 } +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2986/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 7.972229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66097 samples/s/p 2:30:28 } +2024-07-30 03:37:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2988/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.969448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65791 samples/s/p 2:30:30 } +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2990/ 3125], loss: 0.119, per_step_time: 1412ms, lr: 7.966668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66262 samples/s/p 2:30:20 } +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2992/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 7.963886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65290 samples/s/p 2:30:33 } +2024-07-30 03:38:06,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2994/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 7.961103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:06,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65670 samples/s/p 2:30:24 } +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2996/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 7.958318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.65654 samples/s/p 2:30:21 } +2024-07-30 03:38:12,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2998/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 7.955532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:12,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.66072 samples/s/p 2:30:12 } +2024-07-30 03:38:14,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3000/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.952744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65882 samples/s/p 2:30:12 } +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3002/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 7.949957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.66138 samples/s/p 2:30:05 } +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3004/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 7.9471665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65984 samples/s/p 2:30:05 } +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3006/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.9443735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66112 samples/s/p 2:30:00 } +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3008/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 7.94158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65926 samples/s/p 2:30:00 } +2024-07-30 03:38:29,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3010/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 7.938786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:29,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66040 samples/s/p 2:29:55 } +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3012/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.93599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66051 samples/s/p 2:29:52 } +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3014/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 7.933193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65893 samples/s/p 2:29:52 } +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3016/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 7.9303945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65921 samples/s/p 2:29:49 } +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3018/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 7.927595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.66011 samples/s/p 2:29:44 } +2024-07-30 03:38:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3020/ 3125], loss: 0.311, per_step_time: 1415ms, lr: 7.924794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:43,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65307 samples/s/p 2:29:53 } +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3022/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.92199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65845 samples/s/p 2:29:41 } +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3024/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.919186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.66013 samples/s/p 2:29:36 } +2024-07-30 03:38:51,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3026/ 3125], loss: 0.484, per_step_time: 1414ms, lr: 7.91638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:51,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65635 samples/s/p 2:29:39 } +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3028/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 7.9135725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65402 samples/s/p 2:29:40 } +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3030/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.910764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65724 samples/s/p 2:29:32 } +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3032/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 7.907955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65604 samples/s/p 2:29:31 } +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3034/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 7.905143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65440 samples/s/p 2:29:31 } +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3036/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.902331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66155 samples/s/p 2:29:17 } +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3038/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.899518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66118 samples/s/p 2:29:15 } +2024-07-30 03:39:11,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3040/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.896702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:11,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66263 samples/s/p 2:29:09 } +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3042/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.893886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65869 samples/s/p 2:29:13 } +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3044/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 7.891067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66120 samples/s/p 2:29:06 } +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3046/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 7.888248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.65963 samples/s/p 2:29:06 } +2024-07-30 03:39:22,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3048/ 3125], loss: 0.188, per_step_time: 1412ms, lr: 7.885426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:22,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66201 samples/s/p 2:28:59 } +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3050/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 7.882604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66158 samples/s/p 2:28:57 } +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3052/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 7.87978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66127 samples/s/p 2:28:55 } +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3054/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.876955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66033 samples/s/p 2:28:53 } +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3056/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 7.874129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66107 samples/s/p 2:28:49 } +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3058/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 7.871301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.65701 samples/s/p 2:28:53 } +2024-07-30 03:39:39,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3060/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 7.8684725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:39,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66239 samples/s/p 2:28:42 } +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3062/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.865641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65987 samples/s/p 2:28:43 } +2024-07-30 03:39:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3064/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.862808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:45,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65847 samples/s/p 2:28:42 } +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3066/ 3125], loss: 0.247, per_step_time: 1412ms, lr: 7.859976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66421 samples/s/p 2:28:30 } +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3068/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 7.857141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:51,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65661 samples/s/p 2:28:39 } +2024-07-30 03:39:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3070/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 7.854305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65282 samples/s/p 2:28:42 } +2024-07-30 03:39:56,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3072/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 7.851468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:56,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65976 samples/s/p 2:28:29 } +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3074/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.84863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65938 samples/s/p 2:28:26 } +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3076/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.845789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65977 samples/s/p 2:28:23 } +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3078/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.842948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:05,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65915 samples/s/p 2:28:21 } +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3080/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.840105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:08,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65854 samples/s/p 2:28:19 } +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3082/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 7.8372605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65660 samples/s/p 2:28:20 } +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3084/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.834416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65702 samples/s/p 2:28:16 } +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3086/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.831569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:16,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66111 samples/s/p 2:28:07 } +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3088/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 7.82872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66182 samples/s/p 2:28:03 } +2024-07-30 03:40:22,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3090/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.825871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:22,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66079 samples/s/p 2:28:02 } +2024-07-30 03:40:25,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3092/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.82302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:25,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65923 samples/s/p 2:28:01 } +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3094/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.820167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66015 samples/s/p 2:27:57 } +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3096/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 7.817314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65861 samples/s/p 2:27:57 } +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3098/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.814459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65977 samples/s/p 2:27:52 } +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3100/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 7.811602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66002 samples/s/p 2:27:49 } +2024-07-30 03:40:39,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3102/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 7.808745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65748 samples/s/p 2:27:50 } +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3104/ 3125], loss: 0.542, per_step_time: 1414ms, lr: 7.8058865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65500 samples/s/p 2:27:51 } +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3106/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 7.803026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66077 samples/s/p 2:27:39 } +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3108/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 7.800165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.65906 samples/s/p 2:27:39 } +2024-07-30 03:40:50,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3110/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.797301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:50,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66097 samples/s/p 2:27:33 } +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3112/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 7.794437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66047 samples/s/p 2:27:31 } +2024-07-30 03:40:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3114/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 7.791571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:56,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66028 samples/s/p 2:27:29 } +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3116/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 7.788703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66029 samples/s/p 2:27:26 } +2024-07-30 03:41:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3118/ 3125], loss: 0.107, per_step_time: 1414ms, lr: 7.785835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65614 samples/s/p 2:27:29 } +2024-07-30 03:41:04,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3120/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 7.782965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:04,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65751 samples/s/p 2:27:24 } +2024-07-30 03:41:07,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3122/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 7.780095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:07,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65903 samples/s/p 2:27:19 } +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3124/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.777224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:10,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65778 samples/s/p 2:27:18 } +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.774349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65786 samples/s/p 2:27:15 } +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 7.771474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65694 samples/s/p 2:27:14 } +2024-07-30 03:41:19,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 5/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 7.768598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:19,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65856 samples/s/p 2:27:09 } +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 7/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.7657205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:21,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65951 samples/s/p 2:27:04 } +2024-07-30 03:41:24,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 9/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.762842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:24,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.66036 samples/s/p 2:27:00 } +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 11/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.759961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.65824 samples/s/p 2:27:01 } +2024-07-30 03:41:30,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 13/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.757079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:30,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66129 samples/s/p 2:26:53 } +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 15/ 3125], loss: 0.090, per_step_time: 1412ms, lr: 7.754197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:33,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66174 samples/s/p 2:26:50 } +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 17/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 7.751312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66033 samples/s/p 2:26:49 } +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 19/ 3125], loss: 0.346, per_step_time: 1412ms, lr: 7.748427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66193 samples/s/p 2:26:44 } +2024-07-30 03:41:41,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 21/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 7.74554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:41,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66039 samples/s/p 2:26:43 } +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 23/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.742651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:44,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66007 samples/s/p 2:26:41 } +2024-07-30 03:41:47,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 25/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 7.739762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:47,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66018 samples/s/p 2:26:38 } +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 27/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.736871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65875 samples/s/p 2:26:37 } +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 29/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 7.733979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66181 samples/s/p 2:26:30 } +2024-07-30 03:41:55,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 31/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.731086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65974 samples/s/p 2:26:30 } +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 33/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.728191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66084 samples/s/p 2:26:25 } +2024-07-30 03:42:01,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 35/ 3125], loss: 0.050, per_step_time: 1413ms, lr: 7.725296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:01,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66090 samples/s/p 2:26:23 } +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 37/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 7.7223995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65894 samples/s/p 2:26:23 } +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 39/ 3125], loss: 0.476, per_step_time: 1413ms, lr: 7.7195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65977 samples/s/p 2:26:19 } +2024-07-30 03:42:10,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 41/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 7.7166005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66140 samples/s/p 2:26:13 } +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 43/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 7.713699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66055 samples/s/p 2:26:12 } +2024-07-30 03:42:15,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 45/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.710796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:15,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65908 samples/s/p 2:26:11 } +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 47/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.707892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65595 samples/s/p 2:26:13 } +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 49/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 7.704987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65329 samples/s/p 2:26:15 } +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 51/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 7.702081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65348 samples/s/p 2:26:11 } +2024-07-30 03:42:27,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 53/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 7.699174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65648 samples/s/p 2:26:04 } +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 55/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.696265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66008 samples/s/p 2:25:56 } +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 57/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.693354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66171 samples/s/p 2:25:50 } +2024-07-30 03:42:35,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 59/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 7.6904425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:35,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.66035 samples/s/p 2:25:49 } +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 61/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 7.687529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.65871 samples/s/p 2:25:49 } +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 63/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 7.684615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65681 samples/s/p 2:25:49 } +2024-07-30 03:42:44,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 65/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 7.6817005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:44,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.66248 samples/s/p 2:25:38 } +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 67/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 7.678784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65780 samples/s/p 2:25:42 } +2024-07-30 03:42:49,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 69/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 7.675866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:49,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65870 samples/s/p 2:25:38 } +2024-07-30 03:42:52,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 71/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.6729475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65959 samples/s/p 2:25:34 } +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 73/ 3125], loss: 0.266, per_step_time: 1425ms, lr: 7.670027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.61266 samples/s/p 2:26:44 } +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 75/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.667105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:58,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.66093 samples/s/p 2:25:26 } +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 77/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.664182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65996 samples/s/p 2:25:25 } +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 79/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.661257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65930 samples/s/p 2:25:23 } +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 81/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.658331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66091 samples/s/p 2:25:18 } +2024-07-30 03:43:09,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 83/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.655404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:09,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66084 samples/s/p 2:25:15 } +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 85/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 7.652477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66247 samples/s/p 2:25:09 } +2024-07-30 03:43:15,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 87/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.649548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65880 samples/s/p 2:25:12 } +2024-07-30 03:43:18,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 89/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 7.646618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:18,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66232 samples/s/p 2:25:04 } +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 91/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.643685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65929 samples/s/p 2:25:06 } +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 93/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 7.640752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66087 samples/s/p 2:25:01 } +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 95/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 7.637817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66139 samples/s/p 2:24:57 } +2024-07-30 03:43:29,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 97/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6348815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:29,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.66132 samples/s/p 2:24:54 } +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 99/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 7.631944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:32,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65616 samples/s/p 2:24:59 } +2024-07-30 03:43:35,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 101/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 7.629007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:35,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65990 samples/s/p 2:24:51 } +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 103/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 7.626067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65680 samples/s/p 2:24:53 } +2024-07-30 03:43:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 105/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 7.6231267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:40,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65815 samples/s/p 2:24:48 } +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 107/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.6201854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65679 samples/s/p 2:24:47 } +2024-07-30 03:43:46,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 109/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6172423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.66004 samples/s/p 2:24:39 } +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 111/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 7.614297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.66057 samples/s/p 2:24:36 } +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 113/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.6113506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.66002 samples/s/p 2:24:34 } +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 115/ 3125], loss: 0.049, per_step_time: 1412ms, lr: 7.608404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:54,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66246 samples/s/p 2:24:27 } +2024-07-30 03:43:57,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 117/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 7.6054557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65933 samples/s/p 2:24:29 } +2024-07-30 03:44:00,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 119/ 3125], loss: 0.228, per_step_time: 1425ms, lr: 7.6025067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:00,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.61150 samples/s/p 2:25:40 } +2024-07-30 03:44:03,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 121/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.5995563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:03,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66110 samples/s/p 2:24:21 } +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 123/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.5966045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65798 samples/s/p 2:24:23 } +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 125/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.5936505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65755 samples/s/p 2:24:20 } +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 127/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 7.5906964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65566 samples/s/p 2:24:21 } +2024-07-30 03:44:14,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 129/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.5877415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:14,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65816 samples/s/p 2:24:14 } +2024-07-30 03:44:17,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 131/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.5847843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:17,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65976 samples/s/p 2:24:09 } +2024-07-30 03:44:20,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 133/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.5818257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:20,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65751 samples/s/p 2:24:09 } +2024-07-30 03:44:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 135/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.578866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65709 samples/s/p 2:24:07 } +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 137/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 7.5759062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65835 samples/s/p 2:24:02 } +2024-07-30 03:44:29,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 139/ 3125], loss: 0.216, per_step_time: 1415ms, lr: 7.5729445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:29,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65275 samples/s/p 2:24:08 } +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 141/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 7.569982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:31,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.66172 samples/s/p 2:23:52 } +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 143/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 7.567018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65801 samples/s/p 2:23:54 } +2024-07-30 03:44:37,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 145/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 7.5640514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:37,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66251 samples/s/p 2:23:45 } +2024-07-30 03:44:40,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 147/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.5610837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:40,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65932 samples/s/p 2:23:47 } +2024-07-30 03:44:43,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 149/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.5581165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:43,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66166 samples/s/p 2:23:40 } +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 151/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.555147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:46,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66148 samples/s/p 2:23:38 } +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 153/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 7.5521775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:48,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66078 samples/s/p 2:23:36 } +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 155/ 3125], loss: 0.485, per_step_time: 1412ms, lr: 7.5492057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66215 samples/s/p 2:23:31 } +2024-07-30 03:44:54,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 157/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 7.5462335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:54,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65989 samples/s/p 2:23:32 } +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 159/ 3125], loss: 0.145, per_step_time: 1412ms, lr: 7.5432595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66273 samples/s/p 2:23:25 } +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 161/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 7.5402836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66347 samples/s/p 2:23:21 } +2024-07-30 03:45:03,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 163/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 7.5373077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:03,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65835 samples/s/p 2:23:26 } +2024-07-30 03:45:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 165/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 7.5343296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66000 samples/s/p 2:23:20 } +2024-07-30 03:45:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 167/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 7.5313505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:08,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65755 samples/s/p 2:23:21 } +2024-07-30 03:45:11,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 169/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 7.5283706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66101 samples/s/p 2:23:13 } +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 171/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 7.525389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66108 samples/s/p 2:23:10 } +2024-07-30 03:45:17,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 173/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 7.522407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:17,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65718 samples/s/p 2:23:13 } +2024-07-30 03:45:20,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 175/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.519424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:20,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65858 samples/s/p 2:23:08 } +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 177/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 7.516439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66027 samples/s/p 2:23:03 } +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 179/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 7.5134526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66112 samples/s/p 2:22:59 } +2024-07-30 03:45:28,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 181/ 3125], loss: 0.536, per_step_time: 1414ms, lr: 7.5104654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65495 samples/s/p 2:23:05 } +2024-07-30 03:45:31,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 183/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 7.5074754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65734 samples/s/p 2:22:59 } +2024-07-30 03:45:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 185/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.5044863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.66131 samples/s/p 2:22:50 } +2024-07-30 03:45:37,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 187/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.501496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:37,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65574 samples/s/p 2:22:56 } +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 189/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 7.4985037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65853 samples/s/p 2:22:49 } +2024-07-30 03:45:42,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 191/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 7.495511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:42,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65940 samples/s/p 2:22:44 } +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 193/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.4925165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:45,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65797 samples/s/p 2:22:44 } +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 195/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 7.4895215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:48,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65725 samples/s/p 2:22:42 } +2024-07-30 03:45:51,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 197/ 3125], loss: 0.272, per_step_time: 1417ms, lr: 7.4865234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:51,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.64500 samples/s/p 2:22:58 } +2024-07-30 03:45:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 199/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 7.4835257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65503 samples/s/p 2:22:40 } +2024-07-30 03:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 201/ 3125], loss: 0.027, per_step_time: 1413ms, lr: 7.4805257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65812 samples/s/p 2:22:32 } +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 203/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.4775253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65999 samples/s/p 2:22:27 } +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 205/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 7.4745244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65698 samples/s/p 2:22:28 } +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 207/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.4715217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65982 samples/s/p 2:22:21 } +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 209/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 7.4685177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66155 samples/s/p 2:22:16 } +2024-07-30 03:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 211/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.465513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65961 samples/s/p 2:22:16 } +2024-07-30 03:46:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 213/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.462506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65927 samples/s/p 2:22:13 } +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 215/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 7.4594986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66086 samples/s/p 2:22:08 } +2024-07-30 03:46:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 217/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.45649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:19,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66032 samples/s/p 2:22:06 } +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 219/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 7.4534796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:22,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66137 samples/s/p 2:22:02 } +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 221/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.4504687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66195 samples/s/p 2:21:58 } +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 223/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 7.447457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:28,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66122 samples/s/p 2:21:56 } +2024-07-30 03:46:30,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 225/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 7.4444433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66259 samples/s/p 2:21:51 } +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 227/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.4414297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65872 samples/s/p 2:21:55 } +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 229/ 3125], loss: 0.117, per_step_time: 1412ms, lr: 7.438414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66186 samples/s/p 2:21:47 } +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 231/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.4353975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65895 samples/s/p 2:21:48 } +2024-07-30 03:46:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 233/ 3125], loss: 0.202, per_step_time: 1416ms, lr: 7.432379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.64702 samples/s/p 2:22:04 } +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 235/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.429359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65817 samples/s/p 2:21:44 } +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 237/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 7.4263385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66013 samples/s/p 2:21:38 } +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 239/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65943 samples/s/p 2:21:36 } +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 241/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.4202953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:53,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66074 samples/s/p 2:21:32 } +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 243/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.4172717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65877 samples/s/p 2:21:32 } +2024-07-30 03:46:59,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 245/ 3125], loss: 0.160, per_step_time: 1416ms, lr: 7.4142467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:59,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.64683 samples/s/p 2:21:47 } +2024-07-30 03:47:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 247/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 7.4112213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:02,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65280 samples/s/p 2:21:35 } +2024-07-30 03:47:04,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 249/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 7.408193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:04,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.66081 samples/s/p 2:21:20 } +2024-07-30 03:47:07,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 251/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 7.4051645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.66143 samples/s/p 2:21:17 } +2024-07-30 03:47:10,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 253/ 3125], loss: 0.345, per_step_time: 1415ms, lr: 7.4021355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.65163 samples/s/p 2:21:28 } +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 255/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.399104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65822 samples/s/p 2:21:16 } +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 257/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.396072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65786 samples/s/p 2:21:13 } +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 259/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 7.393039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65152 samples/s/p 2:21:20 } +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 261/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 7.3900055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65825 samples/s/p 2:21:07 } +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 263/ 3125], loss: 0.533, per_step_time: 1414ms, lr: 7.3869705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:24,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65707 samples/s/p 2:21:06 } +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 265/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 7.383934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66185 samples/s/p 2:20:56 } +2024-07-30 03:47:30,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 267/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.380896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:30,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65858 samples/s/p 2:20:58 } +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 269/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 7.377857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:33,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65986 samples/s/p 2:20:53 } +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 271/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 7.374817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65975 samples/s/p 2:20:51 } +2024-07-30 03:47:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 273/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.371776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65874 samples/s/p 2:20:49 } +2024-07-30 03:47:41,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 275/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.3687343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:41,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65851 samples/s/p 2:20:47 } +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 277/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.3656915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:44,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.66141 samples/s/p 2:20:40 } +2024-07-30 03:47:47,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 279/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.3626475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:47,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65756 samples/s/p 2:20:43 } +2024-07-30 03:47:50,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 281/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.3596025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:50,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65696 samples/s/p 2:20:41 } +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 283/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.3565557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65856 samples/s/p 2:20:36 } +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 285/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 7.353507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66176 samples/s/p 2:20:28 } +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 287/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 7.350459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65750 samples/s/p 2:20:31 } +2024-07-30 03:48:01,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 289/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.347408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:01,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65949 samples/s/p 2:20:26 } +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 291/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.344357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66033 samples/s/p 2:20:22 } +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 293/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 7.341305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65809 samples/s/p 2:20:22 } +2024-07-30 03:48:10,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 295/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.338252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:10,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65801 samples/s/p 2:20:19 } +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 297/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 7.3351976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66167 samples/s/p 2:20:11 } +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 299/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 7.3321426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66213 samples/s/p 2:20:08 } +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 301/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.329085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65863 samples/s/p 2:20:10 } +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 303/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 7.3260276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65914 samples/s/p 2:20:06 } +2024-07-30 03:48:24,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 305/ 3125], loss: 0.338, per_step_time: 1425ms, lr: 7.3229676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:24,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.61302 samples/s/p 2:21:13 } +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 307/ 3125], loss: 0.191, per_step_time: 1415ms, lr: 7.319908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65289 samples/s/p 2:20:10 } +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 309/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.3168467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.66068 samples/s/p 2:19:56 } +2024-07-30 03:48:32,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 311/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 7.313785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:32,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65668 samples/s/p 2:19:59 } +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 313/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 7.3107217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66033 samples/s/p 2:19:51 } +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 315/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.307658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66083 samples/s/p 2:19:47 } +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 317/ 3125], loss: 0.287, per_step_time: 1415ms, lr: 7.3045926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65148 samples/s/p 2:19:58 } +2024-07-30 03:48:44,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 319/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 7.301526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:44,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65866 samples/s/p 2:19:45 } +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 321/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 7.2984576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66170 samples/s/p 2:19:37 } +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 323/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.2953876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:49,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66046 samples/s/p 2:19:36 } +2024-07-30 03:48:52,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 325/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 7.292318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:52,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66116 samples/s/p 2:19:32 } +2024-07-30 03:48:55,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 327/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.289247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:55,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66014 samples/s/p 2:19:31 } +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 329/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 7.2861753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65432 samples/s/p 2:19:37 } +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 331/ 3125], loss: 0.421, per_step_time: 1412ms, lr: 7.2831026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:01,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66252 samples/s/p 2:19:22 } +2024-07-30 03:49:04,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 333/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 7.280029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:04,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66118 samples/s/p 2:19:21 } +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 335/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 7.2769526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:06,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66386 samples/s/p 2:19:14 } +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 337/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.2738767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65802 samples/s/p 2:19:20 } +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 339/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 7.270799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65913 samples/s/p 2:19:16 } +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 341/ 3125], loss: 0.279, per_step_time: 1415ms, lr: 7.2677194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65158 samples/s/p 2:19:24 } +2024-07-30 03:49:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 343/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.2646403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:18,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.66022 samples/s/p 2:19:08 } +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 345/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.2615594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65620 samples/s/p 2:19:11 } +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 347/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.2584776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:23,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65692 samples/s/p 2:19:08 } +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 349/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.255395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65944 samples/s/p 2:19:01 } +2024-07-30 03:49:29,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 351/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.2523117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:29,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66094 samples/s/p 2:18:56 } +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 353/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.249226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65660 samples/s/p 2:18:59 } +2024-07-30 03:49:35,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 355/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.2461407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:35,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66075 samples/s/p 2:18:51 } +2024-07-30 03:49:38,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 357/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 7.2430526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:38,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65389 samples/s/p 2:18:58 } +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 359/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.2399635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65895 samples/s/p 2:18:48 } +2024-07-30 03:49:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 361/ 3125], loss: 0.337, per_step_time: 1415ms, lr: 7.236874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:43,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65367 samples/s/p 2:18:52 } +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 363/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.233784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66115 samples/s/p 2:18:39 } +2024-07-30 03:49:49,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 365/ 3125], loss: 0.235, per_step_time: 1412ms, lr: 7.230693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:49,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66229 samples/s/p 2:18:34 } +2024-07-30 03:49:52,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 367/ 3125], loss: 0.042, per_step_time: 1413ms, lr: 7.2276007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66048 samples/s/p 2:18:34 } +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 369/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.224507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66113 samples/s/p 2:18:30 } +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 371/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.221411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.65883 samples/s/p 2:18:31 } +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 373/ 3125], loss: 0.220, per_step_time: 1418ms, lr: 7.218316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.64021 samples/s/p 2:18:55 } +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 375/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.215219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.65884 samples/s/p 2:18:25 } +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 377/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 7.21212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65145 samples/s/p 2:18:33 } +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 379/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.209022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66083 samples/s/p 2:18:17 } +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 381/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.205922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66209 samples/s/p 2:18:12 } +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 383/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.202821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66014 samples/s/p 2:18:12 } +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 385/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 7.199719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65517 samples/s/p 2:18:16 } +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 387/ 3125], loss: 0.111, per_step_time: 1414ms, lr: 7.1966165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65743 samples/s/p 2:18:10 } +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 389/ 3125], loss: 0.102, per_step_time: 1415ms, lr: 7.193513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65127 samples/s/p 2:18:16 } +2024-07-30 03:50:26,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 391/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 7.190406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:26,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65868 samples/s/p 2:18:03 } +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 393/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.1872996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66002 samples/s/p 2:17:58 } +2024-07-30 03:50:31,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 395/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.184192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66076 samples/s/p 2:17:54 } +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 397/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 7.181084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66123 samples/s/p 2:17:50 } +2024-07-30 03:50:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 399/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.177975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66068 samples/s/p 2:17:48 } +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 401/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.174864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66270 samples/s/p 2:17:43 } +2024-07-30 03:50:43,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 403/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.1717536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:43,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65842 samples/s/p 2:17:46 } +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 405/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.168641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:46,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66027 samples/s/p 2:17:41 } +2024-07-30 03:50:48,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 407/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 7.1655268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:48,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65949 samples/s/p 2:17:39 } +2024-07-30 03:50:51,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 409/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.162412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:51,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65998 samples/s/p 2:17:35 } +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 411/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.1592967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66165 samples/s/p 2:17:30 } +2024-07-30 03:50:57,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 413/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.1561794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66057 samples/s/p 2:17:29 } +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 415/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.1530612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66026 samples/s/p 2:17:26 } +2024-07-30 03:51:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 417/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 7.149943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:03,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66026 samples/s/p 2:17:24 } +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 419/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 7.146824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65814 samples/s/p 2:17:24 } +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 421/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 7.1437034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66184 samples/s/p 2:17:16 } +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 423/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 7.1405816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65909 samples/s/p 2:17:17 } +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 425/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.137458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65960 samples/s/p 2:17:13 } +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 427/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.1343343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65897 samples/s/p 2:17:11 } +2024-07-30 03:51:20,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 429/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 7.131209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65897 samples/s/p 2:17:09 } +2024-07-30 03:51:22,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 431/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.128083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:22,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65859 samples/s/p 2:17:06 } +2024-07-30 03:51:25,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 433/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 7.1249565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:25,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65731 samples/s/p 2:17:05 } +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 435/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 7.1218287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:28,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65640 samples/s/p 2:17:04 } +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 437/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.1187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65416 samples/s/p 2:17:04 } +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 439/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 7.11557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65783 samples/s/p 2:16:56 } +2024-07-30 03:51:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 441/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.1124396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:37,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65642 samples/s/p 2:16:55 } +2024-07-30 03:51:39,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 443/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 7.109307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:39,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66132 samples/s/p 2:16:45 } +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 445/ 3125], loss: 0.195, per_step_time: 1412ms, lr: 7.106174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66282 samples/s/p 2:16:40 } +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 447/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.103039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:45,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65883 samples/s/p 2:16:43 } +2024-07-30 03:51:48,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 449/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.0999045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:48,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65936 samples/s/p 2:16:40 } +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 451/ 3125], loss: 0.402, per_step_time: 1412ms, lr: 7.0967685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66257 samples/s/p 2:16:32 } +2024-07-30 03:51:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 453/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 7.093632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.65676 samples/s/p 2:16:38 } +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 455/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.0904944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66067 samples/s/p 2:16:29 } +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 457/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 7.0873557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66354 samples/s/p 2:16:22 } +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 459/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.0842143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66029 samples/s/p 2:16:24 } +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 461/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.081074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66067 samples/s/p 2:16:21 } +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 463/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.077932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:08,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66074 samples/s/p 2:16:18 } +2024-07-30 03:52:11,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 465/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.0747888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66123 samples/s/p 2:16:14 } +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 467/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.071645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65860 samples/s/p 2:16:15 } +2024-07-30 03:52:16,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 469/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 7.0685005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:16,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66006 samples/s/p 2:16:10 } +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 471/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.0653537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65848 samples/s/p 2:16:10 } +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 473/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.0622073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65883 samples/s/p 2:16:07 } +2024-07-30 03:52:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 475/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 7.0590595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:25,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65998 samples/s/p 2:16:02 } +2024-07-30 03:52:28,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 477/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.055911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:28,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65906 samples/s/p 2:16:01 } +2024-07-30 03:52:30,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 479/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 7.0527603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:30,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65334 samples/s/p 2:16:06 } +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 481/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 7.0496094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:33,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.65807 samples/s/p 2:15:56 } +2024-07-30 03:52:36,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 483/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 7.046458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66185 samples/s/p 2:15:48 } +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 485/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 7.043305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66124 samples/s/p 2:15:46 } +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 487/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.040151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:42,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66016 samples/s/p 2:15:45 } +2024-07-30 03:52:45,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 489/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.036997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:45,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66159 samples/s/p 2:15:40 } +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 491/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.033841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.65885 samples/s/p 2:15:41 } +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 493/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.0306837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66090 samples/s/p 2:15:35 } +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 495/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.0275264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66147 samples/s/p 2:15:32 } +2024-07-30 03:52:56,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 497/ 3125], loss: 0.416, per_step_time: 1412ms, lr: 7.0243677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:56,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66225 samples/s/p 2:15:28 } +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 499/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.0212086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66074 samples/s/p 2:15:27 } +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 501/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 7.018047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65863 samples/s/p 2:15:27 } +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 503/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 7.014886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65673 samples/s/p 2:15:27 } +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 505/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.0117235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65924 samples/s/p 2:15:21 } +2024-07-30 03:53:10,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 507/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 7.0085603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:10,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66235 samples/s/p 2:15:13 } +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 509/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 7.0053957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65444 samples/s/p 2:15:22 } +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 511/ 3125], loss: 0.140, per_step_time: 1414ms, lr: 7.0022306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65507 samples/s/p 2:15:18 } +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 513/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 6.9990638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:19,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65714 samples/s/p 2:15:12 } +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 515/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 6.9958965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66237 samples/s/p 2:15:02 } +2024-07-30 03:53:24,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 517/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 6.9927287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:24,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66034 samples/s/p 2:15:02 } +2024-07-30 03:53:27,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 519/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 6.9895596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:27,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66071 samples/s/p 2:14:59 } +2024-07-30 03:53:30,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 521/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.9863895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:30,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66029 samples/s/p 2:14:57 } +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 523/ 3125], loss: 0.258, per_step_time: 1420ms, lr: 6.983218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.63014 samples/s/p 2:15:37 } +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 525/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.980046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.65916 samples/s/p 2:14:53 } +2024-07-30 03:53:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 527/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.976873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.66035 samples/s/p 2:14:48 } +2024-07-30 03:53:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 529/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 6.9736993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65901 samples/s/p 2:14:47 } +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 531/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 6.9705247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65903 samples/s/p 2:14:44 } +2024-07-30 03:53:47,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 533/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 6.967349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:47,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65783 samples/s/p 2:14:43 } +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 535/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 6.964172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65383 samples/s/p 2:14:46 } +2024-07-30 03:53:53,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 537/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 6.9609937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:53,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65833 samples/s/p 2:14:37 } +2024-07-30 03:53:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 539/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.957816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:55,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66000 samples/s/p 2:14:32 } +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 541/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 6.9546363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65841 samples/s/p 2:14:31 } +2024-07-30 03:54:01,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 543/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.9514554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:01,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66010 samples/s/p 2:14:26 } +2024-07-30 03:54:04,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 545/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.9482744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:04,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65973 samples/s/p 2:14:23 } +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 547/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 6.945091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.65969 samples/s/p 2:14:21 } +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 549/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 6.9419084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66293 samples/s/p 2:14:13 } +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 551/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.9387243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66045 samples/s/p 2:14:14 } +2024-07-30 03:54:15,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 553/ 3125], loss: 0.216, per_step_time: 1418ms, lr: 6.935539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.64169 samples/s/p 2:14:38 } +2024-07-30 03:54:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 555/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 6.9323532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66151 samples/s/p 2:14:07 } +2024-07-30 03:54:21,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 557/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 6.929166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:21,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65783 samples/s/p 2:14:09 } +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 559/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 6.9259777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65988 samples/s/p 2:14:03 } +2024-07-30 03:54:27,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 561/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 6.9227895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:27,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66102 samples/s/p 2:13:59 } +2024-07-30 03:54:29,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 563/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.9195994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:29,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65963 samples/s/p 2:13:58 } +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 565/ 3125], loss: 0.587, per_step_time: 1413ms, lr: 6.916409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:32,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65957 samples/s/p 2:13:55 } +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 567/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.913218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65855 samples/s/p 2:13:54 } +2024-07-30 03:54:38,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 569/ 3125], loss: 0.142, per_step_time: 1414ms, lr: 6.9100247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:38,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65766 samples/s/p 2:13:53 } +2024-07-30 03:54:41,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 571/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 6.9068315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:41,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65921 samples/s/p 2:13:47 } +2024-07-30 03:54:44,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 573/ 3125], loss: 0.064, per_step_time: 1417ms, lr: 6.9036373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:44,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.64541 samples/s/p 2:14:04 } +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 575/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.9004423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66096 samples/s/p 2:13:39 } +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 577/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 6.8972463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.65860 samples/s/p 2:13:40 } +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 579/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 6.894049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66143 samples/s/p 2:13:33 } +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 581/ 3125], loss: 0.071, per_step_time: 1413ms, lr: 6.8908503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:55,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66099 samples/s/p 2:13:31 } +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 583/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 6.887652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65374 samples/s/p 2:13:38 } +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 585/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 6.8844524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65770 samples/s/p 2:13:30 } +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 587/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.881252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66115 samples/s/p 2:13:22 } +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 589/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 6.8780505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65885 samples/s/p 2:13:23 } +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 591/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.8748477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65978 samples/s/p 2:13:18 } +2024-07-30 03:55:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 593/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.8716445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:12,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.66034 samples/s/p 2:13:15 } +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 595/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 6.8684403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65598 samples/s/p 2:13:18 } +2024-07-30 03:55:18,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 597/ 3125], loss: 0.225, per_step_time: 1418ms, lr: 6.8652353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:18,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.64001 samples/s/p 2:13:38 } +2024-07-30 03:55:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 599/ 3125], loss: 0.277, per_step_time: 1426ms, lr: 6.8620293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:21,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.60807 samples/s/p 2:14:21 } +2024-07-30 03:55:23,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 601/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.858822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65725 samples/s/p 2:13:08 } +2024-07-30 03:55:26,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 603/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 6.855614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65791 samples/s/p 2:13:04 } +2024-07-30 03:55:29,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 605/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 6.852406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65892 samples/s/p 2:13:00 } +2024-07-30 03:55:32,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 607/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 6.8491963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65916 samples/s/p 2:12:57 } +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 609/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.8459854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65713 samples/s/p 2:12:57 } +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 611/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 6.8427744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65752 samples/s/p 2:12:53 } +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 613/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.8395625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65910 samples/s/p 2:12:48 } +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 615/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 6.836349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65977 samples/s/p 2:12:44 } +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 617/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.833135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65914 samples/s/p 2:12:43 } +2024-07-30 03:55:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 619/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 6.829921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66030 samples/s/p 2:12:38 } +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 621/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 6.826705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66071 samples/s/p 2:12:35 } +2024-07-30 03:55:55,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 623/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.823488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:55,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66042 samples/s/p 2:12:32 } +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 625/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 6.8202708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.66035 samples/s/p 2:12:30 } +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 627/ 3125], loss: 0.379, per_step_time: 1414ms, lr: 6.817053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65713 samples/s/p 2:12:31 } +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 629/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.8138334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65899 samples/s/p 2:12:26 } +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 631/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.8106133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65823 samples/s/p 2:12:24 } +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 633/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 6.8073928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65908 samples/s/p 2:12:20 } +2024-07-30 03:56:12,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 635/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 6.804171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:12,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65389 samples/s/p 2:12:24 } +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 637/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.8009476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65881 samples/s/p 2:12:15 } +2024-07-30 03:56:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 639/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 6.7977244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:17,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65826 samples/s/p 2:12:13 } +2024-07-30 03:56:20,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 641/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 6.7945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:20,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66117 samples/s/p 2:12:06 } +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 643/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.7912756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:23,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66010 samples/s/p 2:12:04 } +2024-07-30 03:56:26,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 645/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 6.788049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66113 samples/s/p 2:12:00 } +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 647/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.7848214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.65910 samples/s/p 2:12:00 } +2024-07-30 03:56:31,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 649/ 3125], loss: 0.085, per_step_time: 1417ms, lr: 6.7815945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:31,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.64224 samples/s/p 2:12:21 } +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 651/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.7783653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65908 samples/s/p 2:11:55 } +2024-07-30 03:56:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 653/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 6.7751357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:37,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65950 samples/s/p 2:11:51 } +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 655/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.7719066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66105 samples/s/p 2:11:46 } +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 657/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 6.768675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66061 samples/s/p 2:11:44 } +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 659/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 6.7654423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66031 samples/s/p 2:11:42 } +2024-07-30 03:56:48,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 661/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.76221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66014 samples/s/p 2:11:39 } +2024-07-30 03:56:51,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 663/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 6.7589763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:51,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65954 samples/s/p 2:11:37 } +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 665/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 6.7557417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65991 samples/s/p 2:11:34 } +2024-07-30 03:56:57,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 667/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 6.752506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66044 samples/s/p 2:11:30 } +2024-07-30 03:57:00,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 669/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.7492706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:00,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65984 samples/s/p 2:11:28 } +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 671/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.7460333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66073 samples/s/p 2:11:24 } +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 673/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 6.742795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66184 samples/s/p 2:11:20 } +2024-07-30 03:57:08,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 675/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 6.7395567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:08,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65833 samples/s/p 2:11:22 } +2024-07-30 03:57:11,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 677/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 6.736317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:11,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65798 samples/s/p 2:11:19 } +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 679/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 6.733077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65462 samples/s/p 2:11:21 } +2024-07-30 03:57:17,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 681/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 6.7298356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:17,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65781 samples/s/p 2:11:14 } +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 683/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.7265933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65668 samples/s/p 2:11:13 } +2024-07-30 03:57:22,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 685/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 6.723351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:22,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.66006 samples/s/p 2:11:05 } +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 687/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 6.7201063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65916 samples/s/p 2:11:04 } +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 689/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.7168626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65953 samples/s/p 2:11:00 } +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 691/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.7136175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.66099 samples/s/p 2:10:55 } +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 693/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 6.710371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65507 samples/s/p 2:11:01 } +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 695/ 3125], loss: 0.328, per_step_time: 1417ms, lr: 6.707124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.64531 samples/s/p 2:11:12 } +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 697/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.703876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65839 samples/s/p 2:10:50 } +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 699/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 6.700628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65802 samples/s/p 2:10:48 } +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 701/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.6973794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.66066 samples/s/p 2:10:42 } +2024-07-30 03:57:48,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 703/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 6.6941284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:48,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65658 samples/s/p 2:10:45 } +2024-07-30 03:57:51,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 705/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.690877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:51,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.65926 samples/s/p 2:10:38 } +2024-07-30 03:57:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 707/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.6876255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66132 samples/s/p 2:10:32 } +2024-07-30 03:57:56,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 709/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 6.6843727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:56,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66155 samples/s/p 2:10:29 } +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 711/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 6.681119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66028 samples/s/p 2:10:28 } +2024-07-30 03:58:02,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 713/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.6778657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:02,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.65999 samples/s/p 2:10:26 } +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 715/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.67461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66194 samples/s/p 2:10:20 } +2024-07-30 03:58:08,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 717/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 6.671354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:08,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66251 samples/s/p 2:10:17 } +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 719/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.6680977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66082 samples/s/p 2:10:16 } +2024-07-30 03:58:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 721/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.6648404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66066 samples/s/p 2:10:13 } +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 723/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 6.6615817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65797 samples/s/p 2:10:14 } +2024-07-30 03:58:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 725/ 3125], loss: 0.420, per_step_time: 1416ms, lr: 6.6583234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:19,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.64859 samples/s/p 2:10:24 } +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 727/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.6550633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.65569 samples/s/p 2:10:12 } +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 729/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.6518032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:25,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66074 samples/s/p 2:10:02 } +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 731/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 6.648541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66232 samples/s/p 2:09:57 } +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 733/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 6.6452794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66105 samples/s/p 2:09:56 } +2024-07-30 03:58:33,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 735/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 6.6420166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:33,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66009 samples/s/p 2:09:54 } +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 737/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 6.6387524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65640 samples/s/p 2:09:57 } +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 739/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 6.6354874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65536 samples/s/p 2:09:55 } +2024-07-30 03:58:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 741/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 6.632223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65922 samples/s/p 2:09:47 } +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 743/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 6.6289567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:45,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65726 samples/s/p 2:09:47 } +2024-07-30 03:58:47,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 745/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 6.62569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:47,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66100 samples/s/p 2:09:39 } +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 747/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 6.622422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65938 samples/s/p 2:09:38 } +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 749/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 6.6191533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66054 samples/s/p 2:09:34 } +2024-07-30 03:58:56,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 751/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 6.6158846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66022 samples/s/p 2:09:32 } +2024-07-30 03:58:59,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 753/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 6.612614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66114 samples/s/p 2:09:28 } +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 755/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 6.6093444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66059 samples/s/p 2:09:25 } +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 757/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 6.6060725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66149 samples/s/p 2:09:21 } +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 759/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 6.6028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66119 samples/s/p 2:09:19 } +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 761/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 6.599527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66164 samples/s/p 2:09:16 } +2024-07-30 03:59:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 763/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 6.5962536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:13,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66035 samples/s/p 2:09:15 } +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 765/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.5929794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65951 samples/s/p 2:09:13 } +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 767/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.5897034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65987 samples/s/p 2:09:09 } +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 769/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 6.5864274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65909 samples/s/p 2:09:08 } +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 771/ 3125], loss: 0.358, per_step_time: 1415ms, lr: 6.5831505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65259 samples/s/p 2:09:14 } +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 773/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 6.5798736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65956 samples/s/p 2:09:01 } +2024-07-30 03:59:30,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 775/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 6.5765944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:30,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.66151 samples/s/p 2:08:56 } +2024-07-30 03:59:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 777/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 6.5733157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:33,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65883 samples/s/p 2:08:57 } +2024-07-30 03:59:36,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 779/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 6.570036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:36,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65770 samples/s/p 2:08:56 } +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 781/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.5667555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66191 samples/s/p 2:08:47 } +2024-07-30 03:59:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 783/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 6.5634736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66063 samples/s/p 2:08:46 } +2024-07-30 03:59:44,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 785/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.560192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65890 samples/s/p 2:08:45 } +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 787/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 6.556909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65494 samples/s/p 2:08:48 } +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 789/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 6.553625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65859 samples/s/p 2:08:40 } +2024-07-30 03:59:53,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 791/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 6.550342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66068 samples/s/p 2:08:34 } +2024-07-30 03:59:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 793/ 3125], loss: 0.298, per_step_time: 1414ms, lr: 6.5470563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65694 samples/s/p 2:08:37 } +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 795/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.5437703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66001 samples/s/p 2:08:30 } +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 797/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.540484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65927 samples/s/p 2:08:28 } +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 799/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 6.5371964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66005 samples/s/p 2:08:24 } +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 801/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 6.5339086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:07,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66111 samples/s/p 2:08:20 } +2024-07-30 04:00:10,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 803/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 6.53062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:10,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66122 samples/s/p 2:08:17 } +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 805/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.5273302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65849 samples/s/p 2:08:18 } +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 807/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.5240406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65872 samples/s/p 2:08:15 } +2024-07-30 04:00:18,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 809/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 6.5207496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:18,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66038 samples/s/p 2:08:09 } +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 811/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 6.5174577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66273 samples/s/p 2:08:03 } +2024-07-30 04:00:24,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 813/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.5141653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:24,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66036 samples/s/p 2:08:04 } +2024-07-30 04:00:27,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 815/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 6.510872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66085 samples/s/p 2:08:00 } +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 817/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.507578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66029 samples/s/p 2:07:58 } +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 819/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 6.504284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:32,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65912 samples/s/p 2:07:57 } +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 821/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 6.500989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:35,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66128 samples/s/p 2:07:51 } +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 823/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 6.497693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65866 samples/s/p 2:07:52 } +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 825/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 6.494396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66347 samples/s/p 2:07:43 } +2024-07-30 04:00:44,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 827/ 3125], loss: 0.490, per_step_time: 1413ms, lr: 6.4910982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:44,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66071 samples/s/p 2:07:44 } +2024-07-30 04:00:47,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 829/ 3125], loss: 0.243, per_step_time: 1412ms, lr: 6.4878004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:47,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66214 samples/s/p 2:07:39 } +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 831/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 6.4845017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66045 samples/s/p 2:07:38 } +2024-07-30 04:00:52,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 833/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.481202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:52,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65992 samples/s/p 2:07:36 } +2024-07-30 04:00:55,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 835/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.4779024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:55,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65941 samples/s/p 2:07:34 } +2024-07-30 04:00:58,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 837/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.474601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:58,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65777 samples/s/p 2:07:33 } +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 839/ 3125], loss: 0.248, per_step_time: 1412ms, lr: 6.4712985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66176 samples/s/p 2:07:25 } +2024-07-30 04:01:04,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 841/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 6.4679966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:04,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66081 samples/s/p 2:07:24 } +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 843/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 6.464694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:06,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65659 samples/s/p 2:07:27 } +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 845/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 6.4613905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66249 samples/s/p 2:07:16 } +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 847/ 3125], loss: 0.428, per_step_time: 1414ms, lr: 6.4580854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65654 samples/s/p 2:07:21 } +2024-07-30 04:01:15,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 849/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 6.4547808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:15,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65688 samples/s/p 2:07:18 } +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 851/ 3125], loss: 0.377, per_step_time: 1414ms, lr: 6.4514747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65642 samples/s/p 2:07:15 } +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 853/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 6.448168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65372 samples/s/p 2:07:16 } +2024-07-30 04:01:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 855/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 6.4448614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:23,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.65971 samples/s/p 2:07:05 } +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 857/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 6.4415535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66102 samples/s/p 2:07:01 } +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 859/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 6.4382443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.65988 samples/s/p 2:06:59 } +2024-07-30 04:01:32,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 861/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 6.434935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:32,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66066 samples/s/p 2:06:56 } +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 863/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.4316255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66057 samples/s/p 2:06:53 } +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 865/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.428315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65882 samples/s/p 2:06:52 } +2024-07-30 04:01:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 867/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 6.425004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:40,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65641 samples/s/p 2:06:53 } +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 869/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.4216915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65887 samples/s/p 2:06:47 } +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 871/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 6.4183782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.66136 samples/s/p 2:06:40 } +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 873/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 6.4150654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65708 samples/s/p 2:06:43 } +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 875/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 6.411751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66009 samples/s/p 2:06:37 } +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 877/ 3125], loss: 0.635, per_step_time: 1413ms, lr: 6.408436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66056 samples/s/p 2:06:33 } +2024-07-30 04:01:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 879/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 6.4051214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66025 samples/s/p 2:06:31 } +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 881/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.401805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66104 samples/s/p 2:06:27 } +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 883/ 3125], loss: 0.295, per_step_time: 1425ms, lr: 6.398488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.61132 samples/s/p 2:07:31 } +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 885/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 6.3951707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.66103 samples/s/p 2:06:21 } +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 887/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.391853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65601 samples/s/p 2:06:25 } +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 889/ 3125], loss: 0.163, per_step_time: 1417ms, lr: 6.388534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.64552 samples/s/p 2:06:36 } +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 891/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 6.385215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:14,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65832 samples/s/p 2:06:16 } +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 893/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 6.3818943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66073 samples/s/p 2:06:10 } +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 895/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 6.378574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66102 samples/s/p 2:06:07 } +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 897/ 3125], loss: 0.250, per_step_time: 1412ms, lr: 6.3752523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66202 samples/s/p 2:06:03 } +2024-07-30 04:02:26,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 899/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.371931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:26,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65849 samples/s/p 2:06:05 } +2024-07-30 04:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 901/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.3686084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:29,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66149 samples/s/p 2:05:58 } +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 903/ 3125], loss: 0.049, per_step_time: 1413ms, lr: 6.3652847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66066 samples/s/p 2:05:56 } +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 905/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 6.36196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66125 samples/s/p 2:05:53 } +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 907/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.358636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.65940 samples/s/p 2:05:52 } +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 909/ 3125], loss: 0.149, per_step_time: 1426ms, lr: 6.3553107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.60973 samples/s/p 2:06:56 } +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 911/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 6.3519847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66127 samples/s/p 2:05:44 } +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 913/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 6.3486586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66146 samples/s/p 2:05:41 } +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 915/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.345331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66150 samples/s/p 2:05:38 } +2024-07-30 04:02:51,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 917/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 6.342003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65859 samples/s/p 2:05:39 } +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 919/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 6.338674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:54,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65745 samples/s/p 2:05:38 } +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 921/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.3353455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66165 samples/s/p 2:05:29 } +2024-07-30 04:03:00,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 923/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.332016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:00,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66053 samples/s/p 2:05:28 } +2024-07-30 04:03:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 925/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 6.3286852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:03,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66138 samples/s/p 2:05:24 } +2024-07-30 04:03:05,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 927/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 6.3253538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:05,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65930 samples/s/p 2:05:24 } +2024-07-30 04:03:08,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 929/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 6.3220227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:08,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65519 samples/s/p 2:05:27 } +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 931/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 6.318691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65818 samples/s/p 2:05:20 } +2024-07-30 04:03:14,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 933/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 6.315357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:14,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65823 samples/s/p 2:05:17 } +2024-07-30 04:03:17,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 935/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 6.3120237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:17,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65660 samples/s/p 2:05:16 } +2024-07-30 04:03:20,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 937/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 6.308689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:20,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65906 samples/s/p 2:05:10 } +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 939/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 6.305355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.66251 samples/s/p 2:05:03 } +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 941/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 6.3020193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.66295 samples/s/p 2:04:59 } +2024-07-30 04:03:28,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 943/ 3125], loss: 0.153, per_step_time: 1419ms, lr: 6.2986833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:28,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.63465 samples/s/p 2:05:34 } +2024-07-30 04:03:31,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 945/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 6.2953472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:31,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.65766 samples/s/p 2:05:01 } +2024-07-30 04:03:34,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 947/ 3125], loss: 0.170, per_step_time: 1417ms, lr: 6.2920094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:34,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.64231 samples/s/p 2:05:18 } +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 949/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 6.2886706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66032 samples/s/p 2:04:52 } +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 951/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 6.2853323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66136 samples/s/p 2:04:47 } +2024-07-30 04:03:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 953/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 6.281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65892 samples/s/p 2:04:48 } +2024-07-30 04:03:45,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 955/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.2786535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:45,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66123 samples/s/p 2:04:42 } +2024-07-30 04:03:48,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 957/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 6.2753134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:48,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65757 samples/s/p 2:04:44 } +2024-07-30 04:03:51,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 959/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 6.2719723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:51,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65531 samples/s/p 2:04:44 } +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 961/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.2686304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:54,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66153 samples/s/p 2:04:33 } +2024-07-30 04:03:56,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 963/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.2652884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:56,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66069 samples/s/p 2:04:31 } +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 965/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 6.2619456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66217 samples/s/p 2:04:27 } +2024-07-30 04:04:02,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 967/ 3125], loss: 0.455, per_step_time: 1413ms, lr: 6.2586028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:02,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65872 samples/s/p 2:04:28 } +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 969/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.255258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66043 samples/s/p 2:04:23 } +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 971/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 6.2519143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65981 samples/s/p 2:04:21 } +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 973/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 6.2485683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65714 samples/s/p 2:04:22 } +2024-07-30 04:04:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 975/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.245223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:13,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66081 samples/s/p 2:04:14 } +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 977/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 6.2418762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66055 samples/s/p 2:04:12 } +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 979/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.2385297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65949 samples/s/p 2:04:10 } +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 981/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.2351824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65715 samples/s/p 2:04:11 } +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 983/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 6.2318336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65766 samples/s/p 2:04:07 } +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 985/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 6.228485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65522 samples/s/p 2:04:07 } +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 987/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 6.2251356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65753 samples/s/p 2:04:02 } +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 989/ 3125], loss: 0.135, per_step_time: 1418ms, lr: 6.221786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.64088 samples/s/p 2:04:21 } +2024-07-30 04:04:36,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 991/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 6.218435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.66192 samples/s/p 2:03:50 } +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 993/ 3125], loss: 0.431, per_step_time: 1415ms, lr: 6.215085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65082 samples/s/p 2:04:02 } +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 995/ 3125], loss: 0.215, per_step_time: 1417ms, lr: 6.2117324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.64284 samples/s/p 2:04:10 } +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 997/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.2083805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.66136 samples/s/p 2:03:42 } +2024-07-30 04:04:48,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 999/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 6.205027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.65826 samples/s/p 2:03:44 } +2024-07-30 04:04:50,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1001/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.2016743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:50,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65921 samples/s/p 2:03:40 } +2024-07-30 04:04:53,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1003/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.19832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65896 samples/s/p 2:03:37 } +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1005/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 6.194966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66204 samples/s/p 2:03:30 } +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1007/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 6.19161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65789 samples/s/p 2:03:33 } +2024-07-30 04:05:02,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 6.1882547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:02,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66063 samples/s/p 2:03:26 } +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1011/ 3125], loss: 0.428, per_step_time: 1418ms, lr: 6.1848987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:05,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.63848 samples/s/p 2:03:53 } +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1013/ 3125], loss: 0.426, per_step_time: 1417ms, lr: 6.1815417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.64386 samples/s/p 2:03:43 } +2024-07-30 04:05:10,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1015/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.178185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:10,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66045 samples/s/p 2:03:18 } +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1017/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 6.174826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65858 samples/s/p 2:03:18 } +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1019/ 3125], loss: 0.236, per_step_time: 1414ms, lr: 6.1714672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65746 samples/s/p 2:03:16 } +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1021/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 6.1681085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66132 samples/s/p 2:03:09 } +2024-07-30 04:05:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1023/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.1647493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:22,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65997 samples/s/p 2:03:08 } +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1025/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.161389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65417 samples/s/p 2:03:12 } +2024-07-30 04:05:27,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1027/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 6.158028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:27,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65648 samples/s/p 2:03:06 } +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1029/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 6.1546666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65994 samples/s/p 2:02:59 } +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1031/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 6.1513047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65857 samples/s/p 2:02:58 } +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1033/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 6.147943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66027 samples/s/p 2:02:53 } +2024-07-30 04:05:39,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1035/ 3125], loss: 0.040, per_step_time: 1412ms, lr: 6.1445794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:39,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66213 samples/s/p 2:02:48 } +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1037/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.1412165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66024 samples/s/p 2:02:47 } +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1039/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 6.137852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66196 samples/s/p 2:02:42 } +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1041/ 3125], loss: 0.147, per_step_time: 1412ms, lr: 6.134487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66174 samples/s/p 2:02:40 } +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1043/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.131122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:50,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66016 samples/s/p 2:02:39 } +2024-07-30 04:05:53,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1045/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.1277565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66098 samples/s/p 2:02:35 } +2024-07-30 04:05:56,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1047/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 6.124391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:56,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65929 samples/s/p 2:02:34 } +2024-07-30 04:05:58,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1049/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 6.121024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:58,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65779 samples/s/p 2:02:34 } +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1051/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.117656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65831 samples/s/p 2:02:30 } +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1053/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.114288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.65784 samples/s/p 2:02:28 } +2024-07-30 04:06:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1055/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 6.1109204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:07,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66012 samples/s/p 2:02:22 } +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1057/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.107551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66016 samples/s/p 2:02:19 } +2024-07-30 04:06:13,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1059/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 6.1041824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66224 samples/s/p 2:02:14 } +2024-07-30 04:06:15,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1061/ 3125], loss: 0.301, per_step_time: 1412ms, lr: 6.100812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:15,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66199 samples/s/p 2:02:11 } +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1063/ 3125], loss: 0.454, per_step_time: 1412ms, lr: 6.097441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:18,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66193 samples/s/p 2:02:08 } +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1065/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.0940706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66030 samples/s/p 2:02:08 } +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1067/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 6.090699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65922 samples/s/p 2:02:06 } +2024-07-30 04:06:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1069/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 6.0873276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66166 samples/s/p 2:02:00 } +2024-07-30 04:06:30,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1071/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.083955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:30,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66136 samples/s/p 2:01:58 } +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1073/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 6.0805814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66011 samples/s/p 2:01:57 } +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1075/ 3125], loss: 0.729, per_step_time: 1413ms, lr: 6.0772086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65788 samples/s/p 2:01:57 } +2024-07-30 04:06:35,720 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:07:10,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1077/ 3125], loss: 0.403, per_step_time: 1415ms, lr: 6.0738334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:10,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65078 samples/s/p 2:02:03 } +2024-07-30 04:07:13,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1079/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.070459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:13,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66016 samples/s/p 2:01:48 } +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1081/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 6.0670845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65998 samples/s/p 2:01:46 } +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1083/ 3125], loss: 0.350, per_step_time: 1414ms, lr: 6.0637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65727 samples/s/p 2:01:46 } +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1085/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.060332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.66079 samples/s/p 2:01:39 } +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1087/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 6.056956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65772 samples/s/p 2:01:40 } +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1089/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 6.0535785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65885 samples/s/p 2:01:36 } +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1091/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.0502007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65905 samples/s/p 2:01:33 } +2024-07-30 04:07:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1093/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.0468233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.66123 samples/s/p 2:01:27 } +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1095/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 6.043444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.64974 samples/s/p 2:01:39 } +2024-07-30 04:07:38,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1097/ 3125], loss: 0.269, per_step_time: 1415ms, lr: 6.0400653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:38,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65009 samples/s/p 2:01:36 } +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1099/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 6.0366856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65703 samples/s/p 2:01:24 } +2024-07-30 04:07:44,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1101/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.0333055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:44,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66010 samples/s/p 2:01:17 } +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1103/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.0299253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66107 samples/s/p 2:01:13 } +2024-07-30 04:07:50,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1105/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.026544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:50,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65851 samples/s/p 2:01:13 } +2024-07-30 04:07:52,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1107/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 6.023162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:52,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65831 samples/s/p 2:01:11 } +2024-07-30 04:07:55,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1109/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 6.01978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:55,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66157 samples/s/p 2:01:04 } +2024-07-30 04:07:58,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1111/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.016398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:58,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65929 samples/s/p 2:01:04 } +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1113/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 6.013014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66008 samples/s/p 2:01:00 } +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1115/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.009631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66002 samples/s/p 2:00:57 } +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1117/ 3125], loss: 0.078, per_step_time: 1413ms, lr: 6.0062466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65939 samples/s/p 2:00:55 } +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1119/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.0028624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65573 samples/s/p 2:00:57 } +2024-07-30 04:08:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1121/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 5.9994773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66058 samples/s/p 2:00:48 } +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1123/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.9960917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65838 samples/s/p 2:00:48 } +2024-07-30 04:08:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1125/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 5.992706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65416 samples/s/p 2:00:51 } +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1127/ 3125], loss: 0.462, per_step_time: 1414ms, lr: 5.9893196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65667 samples/s/p 2:00:45 } +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1129/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 5.985932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65747 samples/s/p 2:00:41 } +2024-07-30 04:08:26,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1131/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.9825456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:26,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66000 samples/s/p 2:00:35 } +2024-07-30 04:08:29,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1133/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 5.9791573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:29,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65311 samples/s/p 2:00:41 } +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1135/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 5.975769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:32,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66001 samples/s/p 2:00:29 } +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1137/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.9723807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66076 samples/s/p 2:00:25 } +2024-07-30 04:08:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1139/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 5.968991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66173 samples/s/p 2:00:21 } +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1141/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 5.9656018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66235 samples/s/p 2:00:18 } +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1143/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 5.962211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66005 samples/s/p 2:00:18 } +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1145/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 5.958821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66131 samples/s/p 2:00:13 } +2024-07-30 04:08:49,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1147/ 3125], loss: 0.402, per_step_time: 1416ms, lr: 5.95543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.64800 samples/s/p 2:00:28 } +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1149/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.952038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66028 samples/s/p 2:00:09 } +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1151/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 5.948646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:55,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.65845 samples/s/p 2:00:09 } +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1153/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.9452536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66099 samples/s/p 2:00:02 } +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1155/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 5.941861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66194 samples/s/p 1:59:58 } +2024-07-30 04:09:03,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1157/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.9384674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:03,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66111 samples/s/p 1:59:57 } +2024-07-30 04:09:06,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1159/ 3125], loss: 0.184, per_step_time: 1414ms, lr: 5.935074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65662 samples/s/p 2:00:00 } +2024-07-30 04:09:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1161/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 5.9316794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65514 samples/s/p 1:59:59 } +2024-07-30 04:09:12,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1163/ 3125], loss: 0.257, per_step_time: 1414ms, lr: 5.9282843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:12,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65526 samples/s/p 1:59:56 } +2024-07-30 04:09:15,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1165/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.92489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:15,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65871 samples/s/p 1:59:48 } +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1167/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 5.921494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:17,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65816 samples/s/p 1:59:46 } +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1169/ 3125], loss: 0.143, per_step_time: 1414ms, lr: 5.9180984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65422 samples/s/p 1:59:48 } +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1171/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.914702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65947 samples/s/p 1:59:39 } +2024-07-30 04:09:26,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1173/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 5.911305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:26,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65680 samples/s/p 1:59:40 } +2024-07-30 04:09:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1175/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9079075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65958 samples/s/p 1:59:33 } +2024-07-30 04:09:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1177/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 5.90451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65686 samples/s/p 1:59:34 } +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1179/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 5.9011118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65987 samples/s/p 1:59:27 } +2024-07-30 04:09:37,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1181/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 5.897713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:37,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66101 samples/s/p 1:59:23 } +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1183/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 5.8943137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65238 samples/s/p 1:59:31 } +2024-07-30 04:09:43,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1185/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.890914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:43,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65761 samples/s/p 1:59:22 } +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1187/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 5.887515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65447 samples/s/p 1:59:23 } +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1189/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 5.884114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65526 samples/s/p 1:59:19 } +2024-07-30 04:09:51,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1191/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 5.880714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65639 samples/s/p 1:59:15 } +2024-07-30 04:09:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1193/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.877312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.65983 samples/s/p 1:59:07 } +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1195/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.8739106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66092 samples/s/p 1:59:03 } +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1197/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 5.870509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66250 samples/s/p 1:58:58 } +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1199/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 5.867106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:03,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66110 samples/s/p 1:58:57 } +2024-07-30 04:10:06,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1201/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 5.863704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:06,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66121 samples/s/p 1:58:54 } +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1203/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.8603005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.65956 samples/s/p 1:58:54 } +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1205/ 3125], loss: 0.396, per_step_time: 1412ms, lr: 5.8568967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66206 samples/s/p 1:58:48 } +2024-07-30 04:10:14,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1207/ 3125], loss: 0.055, per_step_time: 1441ms, lr: 5.8534924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:14,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.55161 samples/s/p 2:01:07 } +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1209/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.8500887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66127 samples/s/p 1:58:43 } +2024-07-30 04:10:20,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1211/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.846684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65954 samples/s/p 1:58:42 } +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1213/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.843279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65889 samples/s/p 1:58:40 } +2024-07-30 04:10:26,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1215/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.8398728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66018 samples/s/p 1:58:36 } +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1217/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.8364662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65849 samples/s/p 1:58:35 } +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1219/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 5.83306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66108 samples/s/p 1:58:29 } +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1221/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.829653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66016 samples/s/p 1:58:27 } +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1223/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 5.826246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65921 samples/s/p 1:58:26 } +2024-07-30 04:10:40,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1225/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 5.8228384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:40,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66109 samples/s/p 1:58:21 } +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1227/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 5.81943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:43,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65791 samples/s/p 1:58:22 } +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1229/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 5.8160213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65579 samples/s/p 1:58:22 } +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1231/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 5.8126125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65922 samples/s/p 1:58:14 } +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1233/ 3125], loss: 0.504, per_step_time: 1414ms, lr: 5.8092037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65505 samples/s/p 1:58:17 } +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1235/ 3125], loss: 0.378, per_step_time: 1415ms, lr: 5.805794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65074 samples/s/p 1:58:19 } +2024-07-30 04:10:57,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1237/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 5.8023843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:57,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65492 samples/s/p 1:58:11 } +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1239/ 3125], loss: 0.475, per_step_time: 1413ms, lr: 5.7989732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.66006 samples/s/p 1:58:02 } +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1241/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 5.7955635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66148 samples/s/p 1:57:58 } +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1243/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.7921516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66128 samples/s/p 1:57:55 } +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1245/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.7887405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66153 samples/s/p 1:57:52 } +2024-07-30 04:11:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1247/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.7853285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66090 samples/s/p 1:57:50 } +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1249/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 5.781916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66105 samples/s/p 1:57:47 } +2024-07-30 04:11:17,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1251/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7785032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:17,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66101 samples/s/p 1:57:44 } +2024-07-30 04:11:19,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1253/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 5.7750904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:19,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65668 samples/s/p 1:57:47 } +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1255/ 3125], loss: 0.230, per_step_time: 1415ms, lr: 5.7716775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:22,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65317 samples/s/p 1:57:48 } +2024-07-30 04:11:25,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1257/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 5.7682632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:25,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65936 samples/s/p 1:57:38 } +2024-07-30 04:11:28,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1259/ 3125], loss: 0.243, per_step_time: 1415ms, lr: 5.7648494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:28,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65293 samples/s/p 1:57:43 } +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1261/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 5.7614347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65911 samples/s/p 1:57:32 } +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1263/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.75802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65891 samples/s/p 1:57:30 } +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1265/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.754605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.66135 samples/s/p 1:57:24 } +2024-07-30 04:11:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1267/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.7511893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65825 samples/s/p 1:57:25 } +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1269/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.7477737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65883 samples/s/p 1:57:21 } +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1271/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.7443576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65492 samples/s/p 1:57:23 } +2024-07-30 04:11:48,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1273/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.7409397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:48,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66100 samples/s/p 1:57:13 } +2024-07-30 04:11:51,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1275/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 5.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:51,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66061 samples/s/p 1:57:11 } +2024-07-30 04:11:53,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1277/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 5.7341063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65945 samples/s/p 1:57:09 } +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1279/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.7306884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65887 samples/s/p 1:57:07 } +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1281/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.7272705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65613 samples/s/p 1:57:08 } +2024-07-30 04:12:02,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1283/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.723852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:02,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65872 samples/s/p 1:57:02 } +2024-07-30 04:12:05,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1285/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7204334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:05,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66116 samples/s/p 1:56:56 } +2024-07-30 04:12:08,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1287/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 5.717014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:08,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65550 samples/s/p 1:57:00 } +2024-07-30 04:12:10,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1289/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 5.713595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:10,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66089 samples/s/p 1:56:50 } +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1291/ 3125], loss: 0.583, per_step_time: 1417ms, lr: 5.7101756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.64500 samples/s/p 1:57:07 } +2024-07-30 04:12:16,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1293/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 5.7067546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:16,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65632 samples/s/p 1:56:50 } +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1295/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 5.703335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66093 samples/s/p 1:56:42 } +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1297/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 5.6999133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66076 samples/s/p 1:56:39 } +2024-07-30 04:12:25,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1299/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 5.6964927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:25,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66043 samples/s/p 1:56:37 } +2024-07-30 04:12:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1301/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 5.6930708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:27,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66135 samples/s/p 1:56:33 } +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1303/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 5.6896492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:30,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.65407 samples/s/p 1:56:39 } +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1305/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 5.6862277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65858 samples/s/p 1:56:31 } +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1307/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.682805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65938 samples/s/p 1:56:27 } +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1309/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 5.679382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66225 samples/s/p 1:56:20 } +2024-07-30 04:12:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1311/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.675959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65972 samples/s/p 1:56:21 } +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1313/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.6725357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66073 samples/s/p 1:56:17 } +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1315/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.669112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66077 samples/s/p 1:56:14 } +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1317/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.665688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66140 samples/s/p 1:56:10 } +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1319/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.6622634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:53,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65931 samples/s/p 1:56:10 } +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1321/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 5.658839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66020 samples/s/p 1:56:06 } +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1323/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 5.6554136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65936 samples/s/p 1:56:04 } +2024-07-30 04:13:01,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1325/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 5.651989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:01,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65824 samples/s/p 1:56:03 } +2024-07-30 04:13:04,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1327/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 5.6485633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:04,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65902 samples/s/p 1:55:59 } +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1329/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.645137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65985 samples/s/p 1:55:55 } +2024-07-30 04:13:10,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1331/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 5.6417107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:10,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65115 samples/s/p 1:56:03 } +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1333/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 5.6382846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66041 samples/s/p 1:55:49 } +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1335/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.6348576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65778 samples/s/p 1:55:49 } +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1337/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.63143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65977 samples/s/p 1:55:44 } +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1339/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 5.6280032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66092 samples/s/p 1:55:40 } +2024-07-30 04:13:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1341/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 5.624575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66063 samples/s/p 1:55:37 } +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1343/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 5.621147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65676 samples/s/p 1:55:39 } +2024-07-30 04:13:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1345/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 5.6177187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:30,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65628 samples/s/p 1:55:37 } +2024-07-30 04:13:33,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1347/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.61429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:33,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65549 samples/s/p 1:55:35 } +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1349/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.6108615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65794 samples/s/p 1:55:29 } +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1351/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 5.607432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65843 samples/s/p 1:55:26 } +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1353/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.604002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65870 samples/s/p 1:55:23 } +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1355/ 3125], loss: 0.400, per_step_time: 1412ms, lr: 5.600573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.66202 samples/s/p 1:55:16 } +2024-07-30 04:13:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1357/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.597143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.66120 samples/s/p 1:55:14 } +2024-07-30 04:13:50,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1359/ 3125], loss: 0.180, per_step_time: 1415ms, lr: 5.593712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:50,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65353 samples/s/p 1:55:20 } +2024-07-30 04:13:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1361/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.590282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66134 samples/s/p 1:55:08 } +2024-07-30 04:13:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1363/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.5868504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65865 samples/s/p 1:55:09 } +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1365/ 3125], loss: 0.329, per_step_time: 1414ms, lr: 5.583419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65388 samples/s/p 1:55:12 } +2024-07-30 04:14:01,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1367/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.579988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:01,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66010 samples/s/p 1:55:01 } +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1369/ 3125], loss: 0.155, per_step_time: 1412ms, lr: 5.5765563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66235 samples/s/p 1:54:56 } +2024-07-30 04:14:07,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1371/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 5.5731243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:07,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.66185 samples/s/p 1:54:53 } +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1373/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 5.5696914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.65874 samples/s/p 1:54:54 } +2024-07-30 04:14:12,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1375/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 5.566259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66145 samples/s/p 1:54:48 } +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1377/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 5.562826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66104 samples/s/p 1:54:46 } +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1379/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.5593937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.65813 samples/s/p 1:54:47 } +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1381/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.55596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65859 samples/s/p 1:54:43 } +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1383/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 5.5525265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65761 samples/s/p 1:54:42 } +2024-07-30 04:14:26,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1385/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.5490923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:26,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.66023 samples/s/p 1:54:36 } +2024-07-30 04:14:29,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1387/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 5.5456576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:29,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65952 samples/s/p 1:54:34 } +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1389/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.5422233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.66081 samples/s/p 1:54:29 } +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1391/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 5.538789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65745 samples/s/p 1:54:30 } +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1393/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 5.5353544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65730 samples/s/p 1:54:28 } +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1395/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.5319188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65777 samples/s/p 1:54:24 } +2024-07-30 04:14:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1397/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 5.5284827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65773 samples/s/p 1:54:22 } +2024-07-30 04:14:46,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1399/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.5250475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:46,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65792 samples/s/p 1:54:19 } +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1401/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.521611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65824 samples/s/p 1:54:15 } +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1403/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.5181754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65934 samples/s/p 1:54:11 } +2024-07-30 04:14:55,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1405/ 3125], loss: 0.088, per_step_time: 1413ms, lr: 5.514739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:55,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.66092 samples/s/p 1:54:06 } +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1407/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.5113014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65631 samples/s/p 1:54:09 } +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1409/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 5.507865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65896 samples/s/p 1:54:03 } +2024-07-30 04:15:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1411/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.5044275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66014 samples/s/p 1:53:59 } +2024-07-30 04:15:06,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1413/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 5.5009905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66110 samples/s/p 1:53:55 } +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1415/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 5.497553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65640 samples/s/p 1:53:58 } +2024-07-30 04:15:12,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1417/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 5.4941147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:12,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66043 samples/s/p 1:53:50 } +2024-07-30 04:15:15,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1419/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.490676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.66116 samples/s/p 1:53:46 } +2024-07-30 04:15:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1421/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 5.487238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65926 samples/s/p 1:53:46 } +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1423/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 5.483799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65701 samples/s/p 1:53:46 } +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1425/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.480361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65932 samples/s/p 1:53:40 } +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1427/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.4769216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:26,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65809 samples/s/p 1:53:39 } +2024-07-30 04:15:29,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1429/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 5.4734824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65965 samples/s/p 1:53:34 } +2024-07-30 04:15:32,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1431/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.470042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:32,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65932 samples/s/p 1:53:32 } +2024-07-30 04:15:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1433/ 3125], loss: 0.308, per_step_time: 1412ms, lr: 5.466603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:34,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66217 samples/s/p 1:53:25 } +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1435/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 5.4631632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66105 samples/s/p 1:53:24 } +2024-07-30 04:15:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1437/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 5.4597226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66181 samples/s/p 1:53:20 } +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1439/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 5.4562825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66179 samples/s/p 1:53:17 } +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1441/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4528414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:46,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66135 samples/s/p 1:53:15 } +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1443/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 5.449401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65971 samples/s/p 1:53:14 } +2024-07-30 04:15:51,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1445/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 5.4459592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65214 samples/s/p 1:53:20 } +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1447/ 3125], loss: 0.117, per_step_time: 1414ms, lr: 5.4425186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:54,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65563 samples/s/p 1:53:13 } +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1449/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4390775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.66124 samples/s/p 1:53:04 } +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1451/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.435635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65931 samples/s/p 1:53:03 } +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1453/ 3125], loss: 0.465, per_step_time: 1415ms, lr: 5.432193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65173 samples/s/p 1:53:10 } +2024-07-30 04:16:06,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1455/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.428751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:06,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66014 samples/s/p 1:52:57 } +2024-07-30 04:16:09,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1457/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 5.4253087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:09,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65783 samples/s/p 1:52:57 } +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1459/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 5.4218663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:11,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66124 samples/s/p 1:52:50 } +2024-07-30 04:16:14,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1461/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 5.418424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:14,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66141 samples/s/p 1:52:47 } +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1463/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.4149805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65936 samples/s/p 1:52:46 } +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1465/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 5.4115376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66190 samples/s/p 1:52:40 } +2024-07-30 04:16:23,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1467/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.408094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:23,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66033 samples/s/p 1:52:40 } +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1469/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.4046504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65712 samples/s/p 1:52:41 } +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1471/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 5.401207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65362 samples/s/p 1:52:42 } +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1473/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 5.3977633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65891 samples/s/p 1:52:33 } +2024-07-30 04:16:34,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1475/ 3125], loss: 0.199, per_step_time: 1412ms, lr: 5.3943186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:34,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.66221 samples/s/p 1:52:26 } +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1477/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 5.390875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65989 samples/s/p 1:52:26 } +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1479/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 5.38743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65751 samples/s/p 1:52:26 } +2024-07-30 04:16:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1481/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.3839854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:43,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65884 samples/s/p 1:52:22 } +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1483/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 5.380541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65806 samples/s/p 1:52:20 } +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1485/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.377095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65761 samples/s/p 1:52:17 } +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1487/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 5.3736508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66086 samples/s/p 1:52:11 } +2024-07-30 04:16:54,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1489/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.3702047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:54,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66087 samples/s/p 1:52:08 } +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1491/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 5.366759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66209 samples/s/p 1:52:04 } +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1493/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.363314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65987 samples/s/p 1:52:03 } +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1495/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.359868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65936 samples/s/p 1:52:01 } +2024-07-30 04:17:05,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1497/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.3564213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:05,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66110 samples/s/p 1:51:56 } +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1499/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.3529757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:08,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66090 samples/s/p 1:51:54 } +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1501/ 3125], loss: 0.433, per_step_time: 1412ms, lr: 5.349529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66229 samples/s/p 1:51:49 } +2024-07-30 04:17:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1503/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 5.346082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66048 samples/s/p 1:51:48 } +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1505/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.342636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66025 samples/s/p 1:51:46 } +2024-07-30 04:17:19,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1507/ 3125], loss: 0.189, per_step_time: 1415ms, lr: 5.3391886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:19,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.64987 samples/s/p 1:51:55 } +2024-07-30 04:17:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1509/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 5.3357408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65658 samples/s/p 1:51:45 } +2024-07-30 04:17:25,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1511/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.3322938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:25,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65936 samples/s/p 1:51:38 } +2024-07-30 04:17:28,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1513/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.3288472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:28,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65713 samples/s/p 1:51:38 } +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1515/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.3253993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65858 samples/s/p 1:51:34 } +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1517/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.321952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65985 samples/s/p 1:51:29 } +2024-07-30 04:17:36,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1519/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 5.318504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:36,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.66170 samples/s/p 1:51:24 } +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1521/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.3150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66094 samples/s/p 1:51:22 } +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1523/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.311608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66147 samples/s/p 1:51:19 } +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1525/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 5.3081594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66094 samples/s/p 1:51:17 } +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1527/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.3047115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66036 samples/s/p 1:51:15 } +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1529/ 3125], loss: 0.350, per_step_time: 1412ms, lr: 5.301262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66208 samples/s/p 1:51:10 } +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1531/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 5.2978135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66097 samples/s/p 1:51:08 } +2024-07-30 04:17:56,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1533/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 5.2943647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:56,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65862 samples/s/p 1:51:08 } +2024-07-30 04:17:59,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1535/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 5.290916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:59,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65931 samples/s/p 1:51:05 } +2024-07-30 04:18:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1537/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 5.287467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65737 samples/s/p 1:51:04 } +2024-07-30 04:18:05,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1539/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.2840173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:05,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65722 samples/s/p 1:51:01 } +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1541/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.280567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66288 samples/s/p 1:50:52 } +2024-07-30 04:18:10,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1543/ 3125], loss: 0.397, per_step_time: 1414ms, lr: 5.277118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.65450 samples/s/p 1:50:59 } +2024-07-30 04:18:13,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1545/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.2736686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66109 samples/s/p 1:50:48 } +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1547/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 5.270219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66073 samples/s/p 1:50:46 } +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1549/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.2667688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65903 samples/s/p 1:50:45 } +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1551/ 3125], loss: 0.416, per_step_time: 1414ms, lr: 5.263318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:22,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65421 samples/s/p 1:50:48 } +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1553/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 5.259868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65834 samples/s/p 1:50:40 } +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1555/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.256418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:27,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65464 samples/s/p 1:50:42 } +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1557/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.252967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.66167 samples/s/p 1:50:31 } +2024-07-30 04:18:33,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1559/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.2495175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:33,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65858 samples/s/p 1:50:32 } +2024-07-30 04:18:36,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1561/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.2460664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:36,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65790 samples/s/p 1:50:30 } +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1563/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 5.2426153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65422 samples/s/p 1:50:31 } +2024-07-30 04:18:42,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1565/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 5.2391642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65815 samples/s/p 1:50:24 } +2024-07-30 04:18:44,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1567/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.235713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:44,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65842 samples/s/p 1:50:20 } +2024-07-30 04:18:47,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1569/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 5.232262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:47,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66080 samples/s/p 1:50:15 } +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1571/ 3125], loss: 0.227, per_step_time: 1412ms, lr: 5.2288115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66258 samples/s/p 1:50:10 } +2024-07-30 04:18:53,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1573/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.225359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:53,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65975 samples/s/p 1:50:10 } +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1575/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 5.2219075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66051 samples/s/p 1:50:07 } +2024-07-30 04:18:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1577/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.2184564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65880 samples/s/p 1:50:06 } +2024-07-30 04:19:01,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1579/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.2150044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:01,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65928 samples/s/p 1:50:02 } +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1581/ 3125], loss: 0.413, per_step_time: 1416ms, lr: 5.2115533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.64674 samples/s/p 1:50:14 } +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1583/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 5.2081014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66203 samples/s/p 1:49:54 } +2024-07-30 04:19:10,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1585/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.204649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66133 samples/s/p 1:49:52 } +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1587/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.2011965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.65907 samples/s/p 1:49:51 } +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1589/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 5.197744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.64743 samples/s/p 1:50:02 } +2024-07-30 04:19:18,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1591/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.1942925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:18,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.65981 samples/s/p 1:49:45 } +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1593/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 5.19084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66012 samples/s/p 1:49:42 } +2024-07-30 04:19:24,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1595/ 3125], loss: 0.381, per_step_time: 1412ms, lr: 5.187388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:24,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66270 samples/s/p 1:49:36 } +2024-07-30 04:19:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1597/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.1839343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65534 samples/s/p 1:49:42 } +2024-07-30 04:19:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1599/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 5.1804823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66213 samples/s/p 1:49:31 } +2024-07-30 04:19:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1601/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 5.17703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66045 samples/s/p 1:49:30 } +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1603/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 5.1735765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65560 samples/s/p 1:49:33 } +2024-07-30 04:19:38,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1605/ 3125], loss: 0.489, per_step_time: 1412ms, lr: 5.170124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:38,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.66304 samples/s/p 1:49:21 } +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1607/ 3125], loss: 0.258, per_step_time: 1414ms, lr: 5.166671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65648 samples/s/p 1:49:26 } +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1609/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 5.163218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65615 samples/s/p 1:49:24 } +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1611/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 5.159764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65653 samples/s/p 1:49:20 } +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1613/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 5.156311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65555 samples/s/p 1:49:19 } +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1615/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 5.152858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65766 samples/s/p 1:49:13 } +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1617/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 5.149405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66149 samples/s/p 1:49:06 } +2024-07-30 04:19:58,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1619/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.1459515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:58,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66155 samples/s/p 1:49:03 } +2024-07-30 04:20:01,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1621/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 5.1424972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:01,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66116 samples/s/p 1:49:01 } +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1623/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 5.1390443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65916 samples/s/p 1:49:00 } +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1625/ 3125], loss: 0.078, per_step_time: 1414ms, lr: 5.1355905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:07,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65727 samples/s/p 1:49:00 } +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1627/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 5.1321367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65613 samples/s/p 1:48:58 } +2024-07-30 04:20:12,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1629/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 5.1286834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65891 samples/s/p 1:48:52 } +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1631/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.125229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:15,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65956 samples/s/p 1:48:49 } +2024-07-30 04:20:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1633/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 5.1217744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66106 samples/s/p 1:48:44 } +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1635/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.118321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65809 samples/s/p 1:48:45 } +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1637/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 5.1148677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65954 samples/s/p 1:48:40 } +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1639/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.111413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66030 samples/s/p 1:48:36 } +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1641/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 5.107959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65968 samples/s/p 1:48:34 } +2024-07-30 04:20:32,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1643/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.104505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:32,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66006 samples/s/p 1:48:31 } +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1645/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 5.1010506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66050 samples/s/p 1:48:28 } +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1647/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.097596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66051 samples/s/p 1:48:25 } +2024-07-30 04:20:41,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1649/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 5.0941417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66245 samples/s/p 1:48:20 } +2024-07-30 04:20:43,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1651/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.090688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:43,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.65980 samples/s/p 1:48:20 } +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1653/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.087233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66065 samples/s/p 1:48:16 } +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1655/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 5.0837784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66136 samples/s/p 1:48:13 } +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1657/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.080324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65961 samples/s/p 1:48:12 } +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1659/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.0768704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65981 samples/s/p 1:48:09 } +2024-07-30 04:20:58,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1661/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.0734147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:58,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.66041 samples/s/p 1:48:05 } +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1663/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.069961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65884 samples/s/p 1:48:04 } +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1665/ 3125], loss: 0.072, per_step_time: 1413ms, lr: 5.0665058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65854 samples/s/p 1:48:02 } +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1667/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 5.0630515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65963 samples/s/p 1:47:58 } +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1669/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 5.0595963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65751 samples/s/p 1:47:57 } +2024-07-30 04:21:12,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1671/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 5.056142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:12,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65707 samples/s/p 1:47:55 } +2024-07-30 04:21:15,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1673/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 5.0526874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:15,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65116 samples/s/p 1:47:59 } +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1675/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 5.049232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65819 samples/s/p 1:47:48 } +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1677/ 3125], loss: 0.251, per_step_time: 1415ms, lr: 5.0457775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65359 samples/s/p 1:47:50 } +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1679/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 5.0423228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.66090 samples/s/p 1:47:39 } +2024-07-30 04:21:26,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1681/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 5.038868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:26,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66040 samples/s/p 1:47:37 } +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1683/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 5.035413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:29,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66052 samples/s/p 1:47:34 } +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1685/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.031958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66031 samples/s/p 1:47:31 } +2024-07-30 04:21:34,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1687/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.028503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:34,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65798 samples/s/p 1:47:31 } +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1689/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 5.0250483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65705 samples/s/p 1:47:30 } +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1691/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 5.0215936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:40,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66229 samples/s/p 1:47:21 } +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1693/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.018139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66063 samples/s/p 1:47:20 } +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1695/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 5.014684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65614 samples/s/p 1:47:22 } +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1697/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 5.011229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65965 samples/s/p 1:47:15 } +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1699/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 5.0077733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65993 samples/s/p 1:47:12 } +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1701/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.0043186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66113 samples/s/p 1:47:08 } +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1703/ 3125], loss: 0.478, per_step_time: 1413ms, lr: 5.0008643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65967 samples/s/p 1:47:07 } +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1705/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.997409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65906 samples/s/p 1:47:05 } +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1707/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.993954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:03,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66065 samples/s/p 1:47:00 } +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1709/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.9904984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65858 samples/s/p 1:46:59 } +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1711/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 4.987043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66265 samples/s/p 1:46:52 } +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1713/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 4.9835885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66108 samples/s/p 1:46:51 } +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1715/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 4.980134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66290 samples/s/p 1:46:46 } +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1717/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 4.9766795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65715 samples/s/p 1:46:50 } +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1719/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 4.9732243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65963 samples/s/p 1:46:44 } +2024-07-30 04:22:23,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1721/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 4.9697696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:23,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.66027 samples/s/p 1:46:41 } +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1723/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 4.9663136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65424 samples/s/p 1:46:45 } +2024-07-30 04:22:28,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1725/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 4.962859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:28,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65853 samples/s/p 1:46:37 } +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1727/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 4.9594046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66121 samples/s/p 1:46:31 } +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1729/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 4.95595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66117 samples/s/p 1:46:28 } +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1731/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.952495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65723 samples/s/p 1:46:30 } +2024-07-30 04:22:40,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1733/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 4.9490404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:40,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66017 samples/s/p 1:46:24 } +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1735/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 4.9455857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65632 samples/s/p 1:46:25 } +2024-07-30 04:22:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1737/ 3125], loss: 0.193, per_step_time: 1415ms, lr: 4.9421305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65235 samples/s/p 1:46:27 } +2024-07-30 04:22:48,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1739/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.938676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:48,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65970 samples/s/p 1:46:16 } +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1741/ 3125], loss: 0.430, per_step_time: 1412ms, lr: 4.935221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66292 samples/s/p 1:46:09 } +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1743/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 4.9317664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66077 samples/s/p 1:46:09 } +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1745/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 4.928312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66238 samples/s/p 1:46:04 } +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1747/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 4.924858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.66106 samples/s/p 1:46:03 } +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1749/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.9214036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.65894 samples/s/p 1:46:03 } +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1751/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 4.917948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.66200 samples/s/p 1:45:56 } +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1753/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 4.9144937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.65903 samples/s/p 1:45:57 } +2024-07-30 04:23:11,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1755/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.911039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:11,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65821 samples/s/p 1:45:55 } +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1757/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 4.9075848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65409 samples/s/p 1:45:57 } +2024-07-30 04:23:16,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1759/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.904131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:16,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66249 samples/s/p 1:45:44 } +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1761/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 4.9006767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65791 samples/s/p 1:45:47 } +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1763/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.8972224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66157 samples/s/p 1:45:40 } +2024-07-30 04:23:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1765/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.8937677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66232 samples/s/p 1:45:36 } +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1767/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 4.8903134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65905 samples/s/p 1:45:37 } +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1769/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.8868596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65712 samples/s/p 1:45:36 } +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1771/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 4.883406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65894 samples/s/p 1:45:31 } +2024-07-30 04:23:36,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1773/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.879952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:36,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65952 samples/s/p 1:45:28 } +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1775/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 4.8764978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66120 samples/s/p 1:45:23 } +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1777/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.873044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66072 samples/s/p 1:45:21 } +2024-07-30 04:23:45,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1779/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 4.8695906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:45,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66055 samples/s/p 1:45:18 } +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1781/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 4.866136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.65871 samples/s/p 1:45:18 } +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1783/ 3125], loss: 0.181, per_step_time: 1412ms, lr: 4.8626825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66312 samples/s/p 1:45:10 } +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1785/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 4.859229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66016 samples/s/p 1:45:10 } +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1787/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 4.855775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65957 samples/s/p 1:45:08 } +2024-07-30 04:23:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1789/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 4.852322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:59,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65732 samples/s/p 1:45:08 } +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1791/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.8488687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65791 samples/s/p 1:45:04 } +2024-07-30 04:24:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1793/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 4.845416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:05,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65645 samples/s/p 1:45:03 } +2024-07-30 04:24:07,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1795/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 4.8419615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:07,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65750 samples/s/p 1:44:59 } +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1797/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.8385086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65838 samples/s/p 1:44:55 } +2024-07-30 04:24:13,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1799/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 4.8350553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.66215 samples/s/p 1:44:48 } +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1801/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 4.8316024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65145 samples/s/p 1:44:57 } +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1803/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.82815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66043 samples/s/p 1:44:45 } +2024-07-30 04:24:22,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1805/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 4.824697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:22,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66280 samples/s/p 1:44:39 } +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1807/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 4.821244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66037 samples/s/p 1:44:39 } +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1809/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 4.8177913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66135 samples/s/p 1:44:35 } +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1811/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 4.814338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66106 samples/s/p 1:44:33 } +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1813/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.810886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65871 samples/s/p 1:44:32 } +2024-07-30 04:24:36,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1815/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.8074335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:36,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66049 samples/s/p 1:44:28 } +2024-07-30 04:24:39,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1817/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 4.8039815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65955 samples/s/p 1:44:26 } +2024-07-30 04:24:42,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1819/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 4.800529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66149 samples/s/p 1:44:21 } +2024-07-30 04:24:44,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1821/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 4.797077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:44,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66219 samples/s/p 1:44:17 } +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1823/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.793624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65811 samples/s/p 1:44:19 } +2024-07-30 04:24:50,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1825/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.7901726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:50,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65992 samples/s/p 1:44:14 } +2024-07-30 04:24:53,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1827/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 4.7867206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:53,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65952 samples/s/p 1:44:12 } +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1829/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 4.7832696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65860 samples/s/p 1:44:10 } +2024-07-30 04:24:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1831/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 4.779817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:59,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66007 samples/s/p 1:44:05 } +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1833/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.776366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66100 samples/s/p 1:44:02 } +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1835/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.772915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66039 samples/s/p 1:43:59 } +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1837/ 3125], loss: 0.406, per_step_time: 1417ms, lr: 4.769464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:07,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.64453 samples/s/p 1:44:14 } +2024-07-30 04:25:10,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1839/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.766012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66115 samples/s/p 1:43:53 } +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1841/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 4.762561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65953 samples/s/p 1:43:52 } +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1843/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 4.7591093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65381 samples/s/p 1:43:55 } +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1845/ 3125], loss: 0.663, per_step_time: 1416ms, lr: 4.755659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.64694 samples/s/p 1:44:00 } +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1847/ 3125], loss: 0.470, per_step_time: 1413ms, lr: 4.7522085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65979 samples/s/p 1:43:43 } +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1849/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 4.748758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65714 samples/s/p 1:43:43 } +2024-07-30 04:25:27,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1851/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7453073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:27,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66041 samples/s/p 1:43:37 } +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1853/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 4.741856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65878 samples/s/p 1:43:36 } +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1855/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 4.738406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66167 samples/s/p 1:43:30 } +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1857/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.734956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66108 samples/s/p 1:43:28 } +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1859/ 3125], loss: 0.089, per_step_time: 1414ms, lr: 4.731506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65378 samples/s/p 1:43:33 } +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1861/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 4.728057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65708 samples/s/p 1:43:26 } +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1863/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 4.7246062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65960 samples/s/p 1:43:21 } +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1865/ 3125], loss: 0.362, per_step_time: 1414ms, lr: 4.721157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65721 samples/s/p 1:43:20 } +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1867/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.717707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65947 samples/s/p 1:43:15 } +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1869/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 4.7142576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66172 samples/s/p 1:43:10 } +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1871/ 3125], loss: 0.289, per_step_time: 1416ms, lr: 4.7108088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.64932 samples/s/p 1:43:21 } +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1873/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 4.70736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66117 samples/s/p 1:43:05 } +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1875/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.7039107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66118 samples/s/p 1:43:02 } +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1877/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.700462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66039 samples/s/p 1:43:00 } +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1879/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.6970135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65991 samples/s/p 1:42:58 } +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1881/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.6935643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65868 samples/s/p 1:42:56 } +2024-07-30 04:26:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1883/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 4.690116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:12,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65894 samples/s/p 1:42:53 } +2024-07-30 04:26:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1885/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 4.686668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:15,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66305 samples/s/p 1:42:46 } +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1887/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 4.6832197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65925 samples/s/p 1:42:47 } +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1889/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.679772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65847 samples/s/p 1:42:45 } +2024-07-30 04:26:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1891/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.6763244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65853 samples/s/p 1:42:42 } +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1893/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 4.672877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65663 samples/s/p 1:42:41 } +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1895/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.6694286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.66135 samples/s/p 1:42:34 } +2024-07-30 04:26:32,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1897/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 4.6659816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:32,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66055 samples/s/p 1:42:32 } +2024-07-30 04:26:35,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1899/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 4.662534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:35,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.65930 samples/s/p 1:42:30 } +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1901/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.659087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66212 samples/s/p 1:42:24 } +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1903/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.655641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66004 samples/s/p 1:42:24 } +2024-07-30 04:26:43,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1905/ 3125], loss: 0.525, per_step_time: 1412ms, lr: 4.652194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66208 samples/s/p 1:42:19 } +2024-07-30 04:26:46,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1907/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 4.648748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.65984 samples/s/p 1:42:18 } +2024-07-30 04:26:49,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1909/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 4.6453015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:49,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.65946 samples/s/p 1:42:16 } +2024-07-30 04:26:52,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1911/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 4.6418545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66147 samples/s/p 1:42:11 } +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1913/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.6384084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66044 samples/s/p 1:42:09 } +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1915/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.6349633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66136 samples/s/p 1:42:05 } +2024-07-30 04:27:00,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1917/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.6315176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:00,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66003 samples/s/p 1:42:04 } +2024-07-30 04:27:03,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1919/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.6280725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66046 samples/s/p 1:42:01 } +2024-07-30 04:27:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1921/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 4.624627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65752 samples/s/p 1:42:01 } +2024-07-30 04:27:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1923/ 3125], loss: 0.213, per_step_time: 1415ms, lr: 4.621182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:09,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65308 samples/s/p 1:42:03 } +2024-07-30 04:27:12,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1925/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 4.617736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:12,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65801 samples/s/p 1:41:55 } +2024-07-30 04:27:15,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1927/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.614292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:15,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65704 samples/s/p 1:41:53 } +2024-07-30 04:27:17,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1929/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.6108476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:17,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65951 samples/s/p 1:41:47 } +2024-07-30 04:27:20,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1931/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 4.6074033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.66113 samples/s/p 1:41:43 } +2024-07-30 04:27:23,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1933/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.603959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:23,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65930 samples/s/p 1:41:42 } +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1935/ 3125], loss: 0.469, per_step_time: 1413ms, lr: 4.6005152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65854 samples/s/p 1:41:40 } +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1937/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.5970714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65994 samples/s/p 1:41:36 } +2024-07-30 04:27:32,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1939/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.593627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:32,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.66018 samples/s/p 1:41:33 } +2024-07-30 04:27:34,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1941/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.590184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:34,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.66045 samples/s/p 1:41:29 } +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1943/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.586741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.66031 samples/s/p 1:41:27 } +2024-07-30 04:27:40,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1945/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 4.5832976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:40,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65424 samples/s/p 1:41:30 } +2024-07-30 04:27:43,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1947/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 4.579855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:43,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65996 samples/s/p 1:41:22 } +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1949/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.5764127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65857 samples/s/p 1:41:20 } +2024-07-30 04:27:49,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1951/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 4.5729703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:49,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65677 samples/s/p 1:41:19 } +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1953/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.5695274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65930 samples/s/p 1:41:14 } +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1955/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.5660854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:54,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65862 samples/s/p 1:41:12 } +2024-07-30 04:27:57,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1957/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.5626434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:57,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66090 samples/s/p 1:41:06 } +2024-07-30 04:28:00,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1959/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 4.559202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:00,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65968 samples/s/p 1:41:05 } +2024-07-30 04:28:03,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1961/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 4.555761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:03,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66075 samples/s/p 1:41:01 } +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1963/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 4.55232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66062 samples/s/p 1:40:58 } +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1965/ 3125], loss: 0.447, per_step_time: 1412ms, lr: 4.5488787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66176 samples/s/p 1:40:54 } +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1967/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 4.5454376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:11,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66116 samples/s/p 1:40:52 } +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1969/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.5419965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66118 samples/s/p 1:40:49 } +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1971/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 4.538557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65987 samples/s/p 1:40:48 } +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1973/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 4.535117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66084 samples/s/p 1:40:44 } +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1975/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 4.5316774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:23,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65716 samples/s/p 1:40:45 } +2024-07-30 04:28:25,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1977/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 4.5282372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66102 samples/s/p 1:40:38 } +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1979/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.5247984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65459 samples/s/p 1:40:42 } +2024-07-30 04:28:31,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1981/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 4.521359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:31,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66247 samples/s/p 1:40:31 } +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1983/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 4.5179195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66060 samples/s/p 1:40:30 } +2024-07-30 04:28:37,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1985/ 3125], loss: 0.598, per_step_time: 1413ms, lr: 4.5144807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:37,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.65844 samples/s/p 1:40:29 } +2024-07-30 04:28:40,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1987/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.511043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:40,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66108 samples/s/p 1:40:24 } +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1989/ 3125], loss: 0.072, per_step_time: 1412ms, lr: 4.507604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66313 samples/s/p 1:40:19 } +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1991/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 4.504166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66284 samples/s/p 1:40:16 } +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1993/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.5007287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65725 samples/s/p 1:40:19 } +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1995/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.4972912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65964 samples/s/p 1:40:14 } +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1997/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 4.493853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65724 samples/s/p 1:40:14 } +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1999/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 4.4904164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65792 samples/s/p 1:40:10 } +2024-07-30 04:28:59,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2001/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 4.486979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:59,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65778 samples/s/p 1:40:08 } +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2003/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 4.483543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66038 samples/s/p 1:40:02 } +2024-07-30 04:29:05,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2005/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 4.480107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:05,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66045 samples/s/p 1:39:59 } +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2007/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 4.4766707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65990 samples/s/p 1:39:57 } +2024-07-30 04:29:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2009/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.4732346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:11,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66062 samples/s/p 1:39:53 } +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2011/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 4.4697986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66021 samples/s/p 1:39:51 } +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2013/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 4.466363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65670 samples/s/p 1:39:52 } +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2015/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 4.4629282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:19,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66117 samples/s/p 1:39:44 } +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2017/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.4594935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65968 samples/s/p 1:39:43 } +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2019/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.4560597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65801 samples/s/p 1:39:42 } +2024-07-30 04:29:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2021/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 4.4526246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:28,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65449 samples/s/p 1:39:43 } +2024-07-30 04:29:31,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2023/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.449191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:31,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65692 samples/s/p 1:39:37 } +2024-07-30 04:29:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2025/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 4.445756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65581 samples/s/p 1:39:36 } +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2027/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.442323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65956 samples/s/p 1:39:29 } +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2029/ 3125], loss: 0.114, per_step_time: 1425ms, lr: 4.4388903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.61393 samples/s/p 1:40:15 } +2024-07-30 04:29:42,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2031/ 3125], loss: 0.126, per_step_time: 1415ms, lr: 4.435457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:42,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65204 samples/s/p 1:39:31 } +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2033/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 4.432024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:45,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66258 samples/s/p 1:39:17 } +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2035/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 4.428592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66260 samples/s/p 1:39:14 } +2024-07-30 04:29:50,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2037/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.42516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:50,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66015 samples/s/p 1:39:14 } +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2039/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 4.4217286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66018 samples/s/p 1:39:11 } +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2041/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.4182957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66147 samples/s/p 1:39:07 } +2024-07-30 04:29:59,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2043/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 4.414865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.65834 samples/s/p 1:39:08 } +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2045/ 3125], loss: 0.360, per_step_time: 1412ms, lr: 4.4114336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66262 samples/s/p 1:39:00 } +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2047/ 3125], loss: 0.136, per_step_time: 1442ms, lr: 4.408003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.54534 samples/s/p 1:41:03 } +2024-07-30 04:30:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2049/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.404573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.65997 samples/s/p 1:38:57 } +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2051/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.4011426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66046 samples/s/p 1:38:54 } +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2053/ 3125], loss: 0.081, per_step_time: 1413ms, lr: 4.3977125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66119 samples/s/p 1:38:50 } +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2055/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.3942828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.66078 samples/s/p 1:38:48 } +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2057/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.390853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65982 samples/s/p 1:38:46 } +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2059/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 4.387424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65952 samples/s/p 1:38:44 } +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2061/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 4.3839955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65913 samples/s/p 1:38:41 } +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2063/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 4.380567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65742 samples/s/p 1:38:40 } +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2065/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 4.377139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65954 samples/s/p 1:38:35 } +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2067/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 4.3737114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:33,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65879 samples/s/p 1:38:33 } +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2069/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 4.3702826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66269 samples/s/p 1:38:26 } +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2071/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.3668556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66018 samples/s/p 1:38:26 } +2024-07-30 04:30:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2073/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 4.3634286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65939 samples/s/p 1:38:24 } +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2075/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 4.3600025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65866 samples/s/p 1:38:22 } +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2077/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.3565756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65334 samples/s/p 1:38:25 } +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2079/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 4.35315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65443 samples/s/p 1:38:21 } +2024-07-30 04:30:53,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2081/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 4.3497243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:53,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65682 samples/s/p 1:38:15 } +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2083/ 3125], loss: 0.231, per_step_time: 1416ms, lr: 4.346298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.64608 samples/s/p 1:38:24 } +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2085/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 4.342873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66005 samples/s/p 1:38:06 } +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2087/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.339449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66045 samples/s/p 1:38:03 } +2024-07-30 04:31:04,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2089/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 4.3360237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:04,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66256 samples/s/p 1:37:58 } +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2091/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 4.3326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66092 samples/s/p 1:37:57 } +2024-07-30 04:31:10,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2093/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 4.329176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:10,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66167 samples/s/p 1:37:53 } +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2095/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 4.3257533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66212 samples/s/p 1:37:50 } +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2097/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 4.3223286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66206 samples/s/p 1:37:47 } +2024-07-30 04:31:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2099/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.318906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:18,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.65982 samples/s/p 1:37:47 } +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2101/ 3125], loss: 0.409, per_step_time: 1412ms, lr: 4.3154832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66326 samples/s/p 1:37:40 } +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2103/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 4.3120613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:24,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65994 samples/s/p 1:37:41 } +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2105/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.3086397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66073 samples/s/p 1:37:37 } +2024-07-30 04:31:30,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2107/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.305218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:30,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66025 samples/s/p 1:37:35 } +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2109/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.3017967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65793 samples/s/p 1:37:35 } +2024-07-30 04:31:35,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2111/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 4.298376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:35,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66072 samples/s/p 1:37:29 } +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2113/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 4.2949546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65760 samples/s/p 1:37:29 } +2024-07-30 04:31:41,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2115/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 4.2915344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66074 samples/s/p 1:37:23 } +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2117/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.2881147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65914 samples/s/p 1:37:22 } +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2119/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 4.2846955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66025 samples/s/p 1:37:18 } +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2121/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 4.281276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.66102 samples/s/p 1:37:14 } +2024-07-30 04:31:52,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2123/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 4.2778574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:52,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.65932 samples/s/p 1:37:13 } +2024-07-30 04:31:55,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2125/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 4.274439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:55,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65649 samples/s/p 1:37:14 } +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2127/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.27102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.66035 samples/s/p 1:37:07 } +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2129/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.2676024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:01,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65850 samples/s/p 1:37:06 } +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2131/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 4.264185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66116 samples/s/p 1:37:00 } +2024-07-30 04:32:07,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2133/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 4.2607676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:07,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65995 samples/s/p 1:36:59 } +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2135/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 4.257351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66107 samples/s/p 1:36:55 } +2024-07-30 04:32:12,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2137/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 4.253935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:12,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65954 samples/s/p 1:36:53 } +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2139/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 4.250519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65163 samples/s/p 1:36:59 } +2024-07-30 04:32:18,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2141/ 3125], loss: 0.498, per_step_time: 1413ms, lr: 4.2471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:18,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.66098 samples/s/p 1:36:46 } +2024-07-30 04:32:21,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2143/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 4.2436873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65684 samples/s/p 1:36:48 } +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2145/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.240272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65853 samples/s/p 1:36:43 } +2024-07-30 04:32:26,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2147/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.2368574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:26,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65560 samples/s/p 1:36:43 } +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2149/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.2334436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.66077 samples/s/p 1:36:35 } +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2151/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 4.23003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65553 samples/s/p 1:36:38 } +2024-07-30 04:32:35,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2153/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 4.226616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65772 samples/s/p 1:36:33 } +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2155/ 3125], loss: 0.256, per_step_time: 1418ms, lr: 4.2232023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.63830 samples/s/p 1:36:50 } +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2157/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 4.2197894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65528 samples/s/p 1:36:29 } +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2159/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.216377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65949 samples/s/p 1:36:22 } +2024-07-30 04:32:46,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2161/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 4.2129655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:46,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65908 samples/s/p 1:36:20 } +2024-07-30 04:32:49,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2163/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 4.209554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65712 samples/s/p 1:36:19 } +2024-07-30 04:32:52,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2165/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 4.2061424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:52,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66189 samples/s/p 1:36:11 } +2024-07-30 04:32:55,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2167/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 4.2027314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65432 samples/s/p 1:36:16 } +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2169/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 4.19932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66152 samples/s/p 1:36:06 } +2024-07-30 04:33:00,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2171/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 4.19591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:00,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66150 samples/s/p 1:36:03 } +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2173/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 4.1925005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66092 samples/s/p 1:36:01 } +2024-07-30 04:33:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2175/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.1890917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.65844 samples/s/p 1:36:01 } +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2177/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 4.185682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66197 samples/s/p 1:35:54 } +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2179/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 4.1822736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66200 samples/s/p 1:35:52 } +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2181/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 4.1788658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.65958 samples/s/p 1:35:51 } +2024-07-30 04:33:17,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2183/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.1754583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.65946 samples/s/p 1:35:48 } +2024-07-30 04:33:20,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2185/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 4.1720496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66175 samples/s/p 1:35:43 } +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2187/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.168643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65790 samples/s/p 1:35:44 } +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2189/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.165236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65954 samples/s/p 1:35:40 } +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2191/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.16183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65973 samples/s/p 1:35:37 } +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2193/ 3125], loss: 0.481, per_step_time: 1413ms, lr: 4.1584244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65941 samples/s/p 1:35:34 } +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2195/ 3125], loss: 0.492, per_step_time: 1414ms, lr: 4.1550193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65554 samples/s/p 1:35:35 } +2024-07-30 04:33:37,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2197/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 4.1516146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:37,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65286 samples/s/p 1:35:35 } +2024-07-30 04:33:40,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2199/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 4.148209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:40,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65717 samples/s/p 1:35:28 } +2024-07-30 04:33:43,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2201/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.1448043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:43,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65951 samples/s/p 1:35:23 } +2024-07-30 04:33:46,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2203/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 4.141401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:46,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.66100 samples/s/p 1:35:19 } +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2205/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.1379976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66004 samples/s/p 1:35:17 } +2024-07-30 04:33:51,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2207/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.1345947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:51,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66139 samples/s/p 1:35:13 } +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2209/ 3125], loss: 0.401, per_step_time: 1412ms, lr: 4.131192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:54,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66251 samples/s/p 1:35:09 } +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2211/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 4.12779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66225 samples/s/p 1:35:06 } +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2213/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.1243875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66125 samples/s/p 1:35:04 } +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2215/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 4.1209864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66318 samples/s/p 1:34:59 } +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2217/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 4.117586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66049 samples/s/p 1:34:59 } +2024-07-30 04:34:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2219/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 4.1141857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66005 samples/s/p 1:34:57 } +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2221/ 3125], loss: 0.216, per_step_time: 1412ms, lr: 4.110785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:11,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66196 samples/s/p 1:34:52 } +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2223/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 4.1073854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.65877 samples/s/p 1:34:53 } +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2225/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 4.1039866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65735 samples/s/p 1:34:51 } +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2227/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 4.1005865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65537 samples/s/p 1:34:50 } +2024-07-30 04:34:23,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2229/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 4.0971886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:23,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65886 samples/s/p 1:34:44 } +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2231/ 3125], loss: 0.579, per_step_time: 1413ms, lr: 4.093791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65788 samples/s/p 1:34:42 } +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2233/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 4.0903933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65726 samples/s/p 1:34:40 } +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2235/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.0869963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66123 samples/s/p 1:34:33 } +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2237/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.0836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65973 samples/s/p 1:34:32 } +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2239/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 4.080204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65376 samples/s/p 1:34:35 } +2024-07-30 04:34:40,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2241/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 4.0768073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66257 samples/s/p 1:34:23 } +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2243/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 4.073412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65843 samples/s/p 1:34:25 } +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2245/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 4.070017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:45,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.66029 samples/s/p 1:34:20 } +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2247/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 4.0666228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65707 samples/s/p 1:34:20 } +2024-07-30 04:34:51,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2249/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.063229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:51,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65861 samples/s/p 1:34:16 } +2024-07-30 04:34:54,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2251/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 4.0598356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65716 samples/s/p 1:34:15 } +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2253/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 4.056443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.66115 samples/s/p 1:34:08 } +2024-07-30 04:34:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2255/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 4.0530504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65762 samples/s/p 1:34:09 } +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2257/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 4.049657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65701 samples/s/p 1:34:06 } +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2259/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 4.0462655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65395 samples/s/p 1:34:07 } +2024-07-30 04:35:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2261/ 3125], loss: 0.310, per_step_time: 1412ms, lr: 4.0428745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66234 samples/s/p 1:33:55 } +2024-07-30 04:35:11,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2263/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.039484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:11,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65912 samples/s/p 1:33:56 } +2024-07-30 04:35:14,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2265/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 4.0360937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:14,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66300 samples/s/p 1:33:49 } +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2267/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 4.0327036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65872 samples/s/p 1:33:50 } +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2269/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 4.0293144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65902 samples/s/p 1:33:47 } +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2271/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 4.025924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:22,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66265 samples/s/p 1:33:41 } +2024-07-30 04:35:25,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2273/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 4.0225364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:25,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66128 samples/s/p 1:33:39 } +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2275/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 4.019148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66180 samples/s/p 1:33:36 } +2024-07-30 04:35:31,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2277/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.015761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:31,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66082 samples/s/p 1:33:34 } +2024-07-30 04:35:33,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2279/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 4.0123737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:33,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.65964 samples/s/p 1:33:33 } +2024-07-30 04:35:36,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2281/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.008987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66287 samples/s/p 1:33:27 } +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2283/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 4.005601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65838 samples/s/p 1:33:28 } +2024-07-30 04:35:42,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2285/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 4.0022146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:42,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66054 samples/s/p 1:33:23 } +2024-07-30 04:35:45,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2287/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.9988295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:45,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65886 samples/s/p 1:33:22 } +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2289/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.9954452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66064 samples/s/p 1:33:17 } +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2291/ 3125], loss: 0.377, per_step_time: 1412ms, lr: 3.9920606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.66210 samples/s/p 1:33:13 } +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2293/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.9886772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65679 samples/s/p 1:33:16 } +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2295/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.985294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.66136 samples/s/p 1:33:08 } +2024-07-30 04:35:59,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2297/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 3.9819115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:59,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65639 samples/s/p 1:33:10 } +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2299/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 3.978528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65815 samples/s/p 1:33:06 } +2024-07-30 04:36:05,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2301/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.9751467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:05,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65853 samples/s/p 1:33:03 } +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2303/ 3125], loss: 0.450, per_step_time: 1414ms, lr: 3.9717647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65485 samples/s/p 1:33:03 } +2024-07-30 04:36:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2305/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 3.9683846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:10,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65788 samples/s/p 1:32:58 } +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2307/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.9650045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.66015 samples/s/p 1:32:52 } +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2309/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 3.9616248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66179 samples/s/p 1:32:48 } +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2311/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 3.958245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.65902 samples/s/p 1:32:48 } +2024-07-30 04:36:22,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2313/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 3.9548663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:22,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66122 samples/s/p 1:32:43 } +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2315/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 3.951487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66226 samples/s/p 1:32:39 } +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2317/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.9481097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:27,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66065 samples/s/p 1:32:38 } +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2319/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.9447323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66051 samples/s/p 1:32:35 } +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2321/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 3.9413558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66154 samples/s/p 1:32:31 } +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2323/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.9379793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.65967 samples/s/p 1:32:30 } +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2325/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 3.9346037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:39,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66237 samples/s/p 1:32:25 } +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2327/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.9312285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65987 samples/s/p 1:32:25 } +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2329/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.9278525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66138 samples/s/p 1:32:20 } +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2331/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 3.9244787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66006 samples/s/p 1:32:19 } +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2333/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.921105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66003 samples/s/p 1:32:16 } +2024-07-30 04:36:53,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2335/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 3.9177316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:53,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65892 samples/s/p 1:32:14 } +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2337/ 3125], loss: 0.206, per_step_time: 1417ms, lr: 3.914359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.64275 samples/s/p 1:32:27 } +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2339/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 3.910987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65969 samples/s/p 1:32:08 } +2024-07-30 04:37:01,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2341/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.9076153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65891 samples/s/p 1:32:06 } +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2343/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.9042434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65617 samples/s/p 1:32:05 } +2024-07-30 04:37:07,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2345/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 3.900873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:07,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.66002 samples/s/p 1:31:59 } +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2347/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 3.897502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65661 samples/s/p 1:31:59 } +2024-07-30 04:37:13,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2349/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 3.894133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.66232 samples/s/p 1:31:51 } +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2351/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 3.890764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65666 samples/s/p 1:31:54 } +2024-07-30 04:37:18,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2353/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.887396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.66040 samples/s/p 1:31:47 } +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2355/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 3.8840276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66248 samples/s/p 1:31:42 } +2024-07-30 04:37:24,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2357/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 3.8806597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:24,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65480 samples/s/p 1:31:47 } +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2359/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 3.8772923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66012 samples/s/p 1:31:39 } +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2361/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.873926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65720 samples/s/p 1:31:39 } +2024-07-30 04:37:32,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2363/ 3125], loss: 0.151, per_step_time: 1415ms, lr: 3.8705602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65264 samples/s/p 1:31:41 } +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2365/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.867195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65785 samples/s/p 1:31:33 } +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2367/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.86383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65928 samples/s/p 1:31:29 } +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2369/ 3125], loss: 0.330, per_step_time: 1415ms, lr: 3.8604658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65194 samples/s/p 1:31:33 } +2024-07-30 04:37:44,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2371/ 3125], loss: 0.040, per_step_time: 1414ms, lr: 3.8571015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:44,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65590 samples/s/p 1:31:26 } +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2373/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 3.8537382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.66184 samples/s/p 1:31:18 } +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2375/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.850376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.65816 samples/s/p 1:31:18 } +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2377/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.8470143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66073 samples/s/p 1:31:13 } +2024-07-30 04:37:55,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2379/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.8436524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:55,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66000 samples/s/p 1:31:11 } +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2381/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 3.8402914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.65022 samples/s/p 1:31:18 } +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2383/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.8369312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65832 samples/s/p 1:31:07 } +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2385/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 3.8335716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65983 samples/s/p 1:31:03 } +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2387/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 3.8302114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65950 samples/s/p 1:31:00 } +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2389/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.826853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66116 samples/s/p 1:30:56 } +2024-07-30 04:38:12,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2391/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.8234944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:12,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66088 samples/s/p 1:30:53 } +2024-07-30 04:38:15,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2393/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 3.820137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:15,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65742 samples/s/p 1:30:54 } +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2395/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 3.81678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65939 samples/s/p 1:30:49 } +2024-07-30 04:38:21,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2397/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 3.8134237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:21,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66064 samples/s/p 1:30:45 } +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2399/ 3125], loss: 0.156, per_step_time: 1415ms, lr: 3.8100677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65303 samples/s/p 1:30:49 } +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2401/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.806712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66037 samples/s/p 1:30:39 } +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2403/ 3125], loss: 0.595, per_step_time: 1413ms, lr: 3.8033568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65909 samples/s/p 1:30:38 } +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2405/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 3.8000028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65889 samples/s/p 1:30:35 } +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2407/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 3.7966493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65620 samples/s/p 1:30:35 } +2024-07-30 04:38:38,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2409/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.7932964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65780 samples/s/p 1:30:31 } +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2411/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.7899433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65806 samples/s/p 1:30:28 } +2024-07-30 04:38:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2413/ 3125], loss: 0.084, per_step_time: 1413ms, lr: 3.7865918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66079 samples/s/p 1:30:22 } +2024-07-30 04:38:46,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2415/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.7832397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:46,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66143 samples/s/p 1:30:19 } +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2417/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 3.7798889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65976 samples/s/p 1:30:17 } +2024-07-30 04:38:52,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2419/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.7765392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:52,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65882 samples/s/p 1:30:15 } +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2421/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7731897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66105 samples/s/p 1:30:11 } +2024-07-30 04:38:58,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2423/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 3.7698403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:58,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65834 samples/s/p 1:30:10 } +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2425/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.7664922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66006 samples/s/p 1:30:06 } +2024-07-30 04:39:03,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2427/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.7631446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:03,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65925 samples/s/p 1:30:04 } +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2429/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.7597963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66072 samples/s/p 1:30:00 } +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2431/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.7564498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65949 samples/s/p 1:29:58 } +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2433/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 3.753104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65534 samples/s/p 1:29:59 } +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2435/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7497582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65972 samples/s/p 1:29:52 } +2024-07-30 04:39:17,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2437/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.7464135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:17,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65978 samples/s/p 1:29:49 } +2024-07-30 04:39:20,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2439/ 3125], loss: 0.328, per_step_time: 1415ms, lr: 3.7430698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:20,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65126 samples/s/p 1:29:54 } +2024-07-30 04:39:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2441/ 3125], loss: 0.256, per_step_time: 1414ms, lr: 3.7397258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65769 samples/s/p 1:29:45 } +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2443/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.736382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.66155 samples/s/p 1:29:39 } +2024-07-30 04:39:29,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2445/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.73304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:29,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65699 samples/s/p 1:29:40 } +2024-07-30 04:39:32,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2447/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.7296977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:32,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65086 samples/s/p 1:29:43 } +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2449/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 3.7263565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65842 samples/s/p 1:29:33 } +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2451/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 3.7230163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65977 samples/s/p 1:29:29 } +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2453/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 3.7196764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65759 samples/s/p 1:29:29 } +2024-07-30 04:39:43,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2455/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 3.7163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:43,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65955 samples/s/p 1:29:24 } +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2457/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 3.712998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66062 samples/s/p 1:29:20 } +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2459/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 3.7096588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66135 samples/s/p 1:29:17 } +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2461/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.7063216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66107 samples/s/p 1:29:14 } +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2463/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 3.7029847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65988 samples/s/p 1:29:12 } +2024-07-30 04:39:57,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2465/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.6996487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:57,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65991 samples/s/p 1:29:09 } +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2467/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.6963124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:00,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65942 samples/s/p 1:29:07 } +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2469/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.6929775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66018 samples/s/p 1:29:04 } +2024-07-30 04:40:06,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2471/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 3.6896433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:06,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66113 samples/s/p 1:29:00 } +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2473/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.6863087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.65873 samples/s/p 1:28:59 } +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2475/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.6829756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66136 samples/s/p 1:28:54 } +2024-07-30 04:40:11,714 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2477/ 3125], loss: 0.064, per_step_time: 1493ms, lr: 3.6796432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.35809 samples/s/p 1:33:53 } +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2479/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.676311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65773 samples/s/p 1:28:52 } +2024-07-30 04:40:51,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2481/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 3.67298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:51,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66236 samples/s/p 1:28:44 } +2024-07-30 04:40:54,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2483/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 3.6696492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:54,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65897 samples/s/p 1:28:45 } +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2485/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6663198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65131 samples/s/p 1:28:49 } +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2487/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.662989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65907 samples/s/p 1:28:39 } +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2489/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.6596607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.66128 samples/s/p 1:28:34 } +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2491/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 3.6563322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.64991 samples/s/p 1:28:42 } +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2493/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 3.6530046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:08,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65889 samples/s/p 1:28:31 } +2024-07-30 04:41:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2495/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 3.649678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:11,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65930 samples/s/p 1:28:28 } +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2497/ 3125], loss: 0.399, per_step_time: 1415ms, lr: 3.6463523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65074 samples/s/p 1:28:33 } +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2499/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 3.6430263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65722 samples/s/p 1:28:24 } +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2501/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.639701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.66087 samples/s/p 1:28:18 } +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2503/ 3125], loss: 0.176, per_step_time: 1414ms, lr: 3.6363765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65749 samples/s/p 1:28:18 } +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2505/ 3125], loss: 0.574, per_step_time: 1424ms, lr: 3.633053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.61469 samples/s/p 1:28:55 } +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2507/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6297301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65248 samples/s/p 1:28:17 } +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2509/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.6264082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65629 samples/s/p 1:28:11 } +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2511/ 3125], loss: 0.570, per_step_time: 1414ms, lr: 3.623086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65425 samples/s/p 1:28:10 } +2024-07-30 04:41:37,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2513/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 3.6197655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:37,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.66181 samples/s/p 1:28:00 } +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2515/ 3125], loss: 0.619, per_step_time: 1413ms, lr: 3.616444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65857 samples/s/p 1:28:00 } +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2517/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 3.6131246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65548 samples/s/p 1:28:00 } +2024-07-30 04:41:45,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2519/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 3.6098056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65572 samples/s/p 1:27:57 } +2024-07-30 04:41:48,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2521/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 3.6064878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:48,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.66080 samples/s/p 1:27:49 } +2024-07-30 04:41:51,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2523/ 3125], loss: 0.164, per_step_time: 1429ms, lr: 3.6031697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:51,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.59635 samples/s/p 1:28:47 } +2024-07-30 04:41:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2525/ 3125], loss: 0.048, per_step_time: 1412ms, lr: 3.5998528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:54,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66189 samples/s/p 1:27:43 } +2024-07-30 04:41:57,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2527/ 3125], loss: 0.453, per_step_time: 1414ms, lr: 3.5965368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:57,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65496 samples/s/p 1:27:46 } +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2529/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.5932212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65827 samples/s/p 1:27:40 } +2024-07-30 04:42:02,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2531/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 3.5899054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65993 samples/s/p 1:27:36 } +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2533/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 3.5865914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65481 samples/s/p 1:27:38 } +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2535/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.5832775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65900 samples/s/p 1:27:31 } +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2537/ 3125], loss: 0.054, per_step_time: 1414ms, lr: 3.5799646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65768 samples/s/p 1:27:30 } +2024-07-30 04:42:14,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2539/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.5766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:14,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65840 samples/s/p 1:27:26 } +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2541/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.573341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.66027 samples/s/p 1:27:22 } +2024-07-30 04:42:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2543/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 3.5700302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:19,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65609 samples/s/p 1:27:23 } +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2545/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 3.5667192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65632 samples/s/p 1:27:20 } +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2547/ 3125], loss: 0.118, per_step_time: 1415ms, lr: 3.563409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65298 samples/s/p 1:27:20 } +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2549/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 3.5601004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65736 samples/s/p 1:27:13 } +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2551/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 3.5567923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.66150 samples/s/p 1:27:06 } +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2553/ 3125], loss: 0.078, per_step_time: 1414ms, lr: 3.5534852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65555 samples/s/p 1:27:09 } +2024-07-30 04:42:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2555/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 3.5501782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65429 samples/s/p 1:27:07 } +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2557/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.546872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.66045 samples/s/p 1:26:59 } +2024-07-30 04:42:42,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2559/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 3.5435658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:42,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.66049 samples/s/p 1:26:56 } +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2561/ 3125], loss: 0.240, per_step_time: 1412ms, lr: 3.5402613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66189 samples/s/p 1:26:52 } +2024-07-30 04:42:48,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2563/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.5369574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:48,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65910 samples/s/p 1:26:52 } +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2565/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.533654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65956 samples/s/p 1:26:48 } +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2567/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 3.5303517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65986 samples/s/p 1:26:45 } +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2569/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 3.5270493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65978 samples/s/p 1:26:43 } +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2571/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 3.5237483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:59,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66101 samples/s/p 1:26:39 } +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2573/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.5204469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65950 samples/s/p 1:26:37 } +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2575/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 3.5171472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65484 samples/s/p 1:26:39 } +2024-07-30 04:43:08,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2577/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 3.5138485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66107 samples/s/p 1:26:30 } +2024-07-30 04:43:10,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2579/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.5105502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65644 samples/s/p 1:26:31 } +2024-07-30 04:43:13,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2581/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 3.5072524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:13,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.66134 samples/s/p 1:26:24 } +2024-07-30 04:43:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2583/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 3.5039554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65968 samples/s/p 1:26:23 } +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2585/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5006594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65849 samples/s/p 1:26:21 } +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2587/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 3.4973639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:22,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65385 samples/s/p 1:26:23 } +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2589/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4940683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65991 samples/s/p 1:26:14 } +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2591/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 3.4907746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:27,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.66088 samples/s/p 1:26:10 } +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2593/ 3125], loss: 0.070, per_step_time: 1414ms, lr: 3.4874804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65479 samples/s/p 1:26:13 } +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2595/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 3.4841883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65719 samples/s/p 1:26:08 } +2024-07-30 04:43:36,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2597/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 3.4808963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:36,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65661 samples/s/p 1:26:06 } +2024-07-30 04:43:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2599/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 3.4776056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65487 samples/s/p 1:26:05 } +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2601/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4743143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65814 samples/s/p 1:25:59 } +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2603/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 3.4710242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65986 samples/s/p 1:25:54 } +2024-07-30 04:43:47,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2605/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.467735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65998 samples/s/p 1:25:51 } +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2607/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.4644468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:50,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65792 samples/s/p 1:25:51 } +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2609/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 3.4611594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65787 samples/s/p 1:25:48 } +2024-07-30 04:43:56,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2611/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4578727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:56,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66001 samples/s/p 1:25:43 } +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2613/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.4545865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65974 samples/s/p 1:25:40 } +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2615/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.4513014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66110 samples/s/p 1:25:36 } +2024-07-30 04:44:04,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2617/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 3.4480156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:04,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65812 samples/s/p 1:25:36 } +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2619/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 3.444732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65808 samples/s/p 1:25:33 } +2024-07-30 04:44:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2621/ 3125], loss: 0.879, per_step_time: 1413ms, lr: 3.4414493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65863 samples/s/p 1:25:30 } +2024-07-30 04:44:13,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2623/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 3.438167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:13,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65130 samples/s/p 1:25:34 } +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2625/ 3125], loss: 0.056, per_step_time: 1418ms, lr: 3.434885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:16,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.63990 samples/s/p 1:25:41 } +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2627/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.4316042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66026 samples/s/p 1:25:20 } +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2629/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 3.4283244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66212 samples/s/p 1:25:16 } +2024-07-30 04:44:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2631/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 3.4250438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66215 samples/s/p 1:25:13 } +2024-07-30 04:44:27,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2633/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 3.4217655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:27,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65989 samples/s/p 1:25:12 } +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2635/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.4184877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66286 samples/s/p 1:25:06 } +2024-07-30 04:44:33,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2637/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 3.4152101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65787 samples/s/p 1:25:08 } +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2639/ 3125], loss: 0.533, per_step_time: 1413ms, lr: 3.4119344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65863 samples/s/p 1:25:05 } +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2641/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 3.4086588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65361 samples/s/p 1:25:06 } +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2643/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 3.405384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65899 samples/s/p 1:24:59 } +2024-07-30 04:44:44,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2645/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 3.402109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:44,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66425 samples/s/p 1:24:51 } +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2647/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 3.3988356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65796 samples/s/p 1:24:54 } +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2649/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3955628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.66005 samples/s/p 1:24:49 } +2024-07-30 04:44:52,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2651/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 3.3922913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.66005 samples/s/p 1:24:46 } +2024-07-30 04:44:55,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2653/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.3890205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65976 samples/s/p 1:24:44 } +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2655/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 3.3857502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65435 samples/s/p 1:24:46 } +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2657/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 3.3824806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65749 samples/s/p 1:24:40 } +2024-07-30 04:45:04,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2659/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.3792119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:04,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65991 samples/s/p 1:24:35 } +2024-07-30 04:45:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2661/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.3759432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65979 samples/s/p 1:24:32 } +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2663/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.3726762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65817 samples/s/p 1:24:31 } +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2665/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 3.36941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65968 samples/s/p 1:24:27 } +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2667/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.3661445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65813 samples/s/p 1:24:25 } +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2669/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.3628792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65936 samples/s/p 1:24:22 } +2024-07-30 04:45:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2671/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 3.3596154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65990 samples/s/p 1:24:18 } +2024-07-30 04:45:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2673/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 3.3563524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66135 samples/s/p 1:24:14 } +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2675/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 3.353089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66063 samples/s/p 1:24:12 } +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2677/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.3498275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65856 samples/s/p 1:24:11 } +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2679/ 3125], loss: 0.157, per_step_time: 1414ms, lr: 3.3465665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:32,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65764 samples/s/p 1:24:09 } +2024-07-30 04:45:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2681/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 3.3433062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66220 samples/s/p 1:24:02 } +2024-07-30 04:45:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2683/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 3.340047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65910 samples/s/p 1:24:02 } +2024-07-30 04:45:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2685/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 3.3367887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65345 samples/s/p 1:24:04 } +2024-07-30 04:45:43,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2687/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.333531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:43,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.66120 samples/s/p 1:23:54 } +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2689/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 3.3302733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66022 samples/s/p 1:23:53 } +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2691/ 3125], loss: 0.316, per_step_time: 1412ms, lr: 3.3270173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66175 samples/s/p 1:23:48 } +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2693/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3237618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.66098 samples/s/p 1:23:46 } +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2695/ 3125], loss: 0.215, per_step_time: 1416ms, lr: 3.3205074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.64697 samples/s/p 1:23:56 } +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2697/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.3172535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65956 samples/s/p 1:23:42 } +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2699/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 3.3140009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65979 samples/s/p 1:23:39 } +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2701/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.3107483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65927 samples/s/p 1:23:36 } +2024-07-30 04:46:06,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2703/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 3.3074969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65759 samples/s/p 1:23:35 } +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2705/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 3.3042456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65842 samples/s/p 1:23:31 } +2024-07-30 04:46:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2707/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 3.3009962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65853 samples/s/p 1:23:29 } +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2709/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 3.2977473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65424 samples/s/p 1:23:30 } +2024-07-30 04:46:17,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2711/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 3.2944995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:17,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65488 samples/s/p 1:23:26 } +2024-07-30 04:46:20,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2713/ 3125], loss: 0.175, per_step_time: 1415ms, lr: 3.291252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:20,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65065 samples/s/p 1:23:27 } +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2715/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2880055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66016 samples/s/p 1:23:16 } +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2717/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 3.2847588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:26,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66110 samples/s/p 1:23:12 } +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2719/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.2815146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66051 samples/s/p 1:23:10 } +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2721/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 3.2782705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66082 samples/s/p 1:23:07 } +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2723/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 3.275028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65924 samples/s/p 1:23:05 } +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2725/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 3.2717846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66052 samples/s/p 1:23:01 } +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2727/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 3.2685434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66075 samples/s/p 1:22:58 } +2024-07-30 04:46:43,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2729/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 3.265303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:43,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65859 samples/s/p 1:22:57 } +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2731/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2620633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.66159 samples/s/p 1:22:52 } +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2733/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 3.2588234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65977 samples/s/p 1:22:51 } +2024-07-30 04:46:52,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2735/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 3.2555854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:52,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65730 samples/s/p 1:22:50 } +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2737/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 3.2523476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65743 samples/s/p 1:22:47 } +2024-07-30 04:46:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2739/ 3125], loss: 0.217, per_step_time: 1428ms, lr: 3.2491112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:57,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.60035 samples/s/p 1:23:35 } +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2741/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.2458759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66107 samples/s/p 1:22:38 } +2024-07-30 04:47:03,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2743/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 3.242641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:03,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65791 samples/s/p 1:22:38 } +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2745/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 3.2394066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66207 samples/s/p 1:22:32 } +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2747/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.236173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:09,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66012 samples/s/p 1:22:31 } +2024-07-30 04:47:11,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2749/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 3.2329403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66105 samples/s/p 1:22:27 } +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2751/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.2297091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66069 samples/s/p 1:22:24 } +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2753/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 3.2264786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65896 samples/s/p 1:22:23 } +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2755/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 3.2232485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66028 samples/s/p 1:22:19 } +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2757/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 3.2200196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65983 samples/s/p 1:22:17 } +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2759/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.2167916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65942 samples/s/p 1:22:14 } +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2761/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 3.2135636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65718 samples/s/p 1:22:13 } +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2763/ 3125], loss: 0.136, per_step_time: 1414ms, lr: 3.2103371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65754 samples/s/p 1:22:10 } +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2765/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.2071118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65909 samples/s/p 1:22:06 } +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2767/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 3.2038872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:37,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65854 samples/s/p 1:22:04 } +2024-07-30 04:47:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2769/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.200663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.66169 samples/s/p 1:21:58 } +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2771/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 3.1974405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65848 samples/s/p 1:21:58 } +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2773/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 3.1942182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65742 samples/s/p 1:21:56 } +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2775/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 3.190996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65739 samples/s/p 1:21:53 } +2024-07-30 04:47:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2777/ 3125], loss: 0.291, per_step_time: 1415ms, lr: 3.1877757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:51,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65204 samples/s/p 1:21:55 } +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2779/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 3.1845566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66124 samples/s/p 1:21:44 } +2024-07-30 04:47:57,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2781/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 3.1813377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:57,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66169 samples/s/p 1:21:41 } +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2783/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.1781199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:00,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66168 samples/s/p 1:21:38 } +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2785/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 3.1749032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66035 samples/s/p 1:21:37 } +2024-07-30 04:48:05,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2787/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.171687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:05,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65983 samples/s/p 1:21:34 } +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2789/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1684717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66109 samples/s/p 1:21:30 } +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2791/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 3.1652569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:11,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66000 samples/s/p 1:21:29 } +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2793/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.162043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66061 samples/s/p 1:21:25 } +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2795/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 3.1588309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65944 samples/s/p 1:21:23 } +2024-07-30 04:48:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2797/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.1556194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:19,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66089 samples/s/p 1:21:19 } +2024-07-30 04:48:22,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2799/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.152409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65936 samples/s/p 1:21:18 } +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2801/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.1491986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66112 samples/s/p 1:21:13 } +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2803/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 3.1459897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65507 samples/s/p 1:21:16 } +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2805/ 3125], loss: 0.419, per_step_time: 1412ms, lr: 3.1427805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66195 samples/s/p 1:21:07 } +2024-07-30 04:48:34,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2807/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.1395732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65974 samples/s/p 1:21:06 } +2024-07-30 04:48:36,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2809/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.136367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:36,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65502 samples/s/p 1:21:07 } +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2811/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.133162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66045 samples/s/p 1:21:00 } +2024-07-30 04:48:42,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2813/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.1299573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:42,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65871 samples/s/p 1:20:59 } +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2815/ 3125], loss: 0.597, per_step_time: 1414ms, lr: 3.1267534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65770 samples/s/p 1:20:57 } +2024-07-30 04:48:48,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2817/ 3125], loss: 0.322, per_step_time: 1415ms, lr: 3.1235509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:48,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65272 samples/s/p 1:20:58 } +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2819/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.1203479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65792 samples/s/p 1:20:51 } +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2821/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.1171471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.66153 samples/s/p 1:20:45 } +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2823/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1139475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65910 samples/s/p 1:20:44 } +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2825/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 3.110748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66180 samples/s/p 1:20:39 } +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2827/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 3.1075494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66076 samples/s/p 1:20:37 } +2024-07-30 04:49:05,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2829/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 3.1043523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66059 samples/s/p 1:20:34 } +2024-07-30 04:49:08,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2831/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 3.1011564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.65944 samples/s/p 1:20:32 } +2024-07-30 04:49:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2833/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.0979597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.65798 samples/s/p 1:20:31 } +2024-07-30 04:49:13,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2835/ 3125], loss: 0.214, per_step_time: 1418ms, lr: 3.094765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.63916 samples/s/p 1:20:44 } +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2837/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0915708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66168 samples/s/p 1:20:22 } +2024-07-30 04:49:19,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2839/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.0883782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:19,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66049 samples/s/p 1:20:20 } +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2841/ 3125], loss: 0.094, per_step_time: 1412ms, lr: 3.0851863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66239 samples/s/p 1:20:16 } +2024-07-30 04:49:25,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2843/ 3125], loss: 0.482, per_step_time: 1416ms, lr: 3.0819954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:25,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.64829 samples/s/p 1:20:25 } +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2845/ 3125], loss: 0.384, per_step_time: 1415ms, lr: 3.0788058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65048 samples/s/p 1:20:20 } +2024-07-30 04:49:30,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2847/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.0756155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:30,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65842 samples/s/p 1:20:11 } +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2849/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 3.0724268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.66208 samples/s/p 1:20:05 } +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2851/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 3.0692397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65748 samples/s/p 1:20:06 } +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2853/ 3125], loss: 0.544, per_step_time: 1413ms, lr: 3.0660533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.65953 samples/s/p 1:20:01 } +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2855/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 3.062868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:42,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66100 samples/s/p 1:19:57 } +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2857/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 3.0596836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66085 samples/s/p 1:19:55 } +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2859/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.0564995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66150 samples/s/p 1:19:51 } +2024-07-30 04:49:50,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2861/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.053317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:50,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66011 samples/s/p 1:19:50 } +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2863/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.0501344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66081 samples/s/p 1:19:46 } +2024-07-30 04:49:56,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2865/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 3.0469537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:56,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66214 samples/s/p 1:19:42 } +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2867/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.0437736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66045 samples/s/p 1:19:41 } +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2869/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.040595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66155 samples/s/p 1:19:37 } +2024-07-30 04:50:04,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2871/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.0374165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:04,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65938 samples/s/p 1:19:36 } +2024-07-30 04:50:07,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2873/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 3.0342396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:07,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65714 samples/s/p 1:19:35 } +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2875/ 3125], loss: 0.374, per_step_time: 1415ms, lr: 3.0310637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:10,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65060 samples/s/p 1:19:38 } +2024-07-30 04:50:13,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2877/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.0278873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:13,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65720 samples/s/p 1:19:29 } +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2879/ 3125], loss: 0.043, per_step_time: 1419ms, lr: 3.0247134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.63452 samples/s/p 1:19:46 } +2024-07-30 04:50:18,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2881/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 3.02154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:18,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66055 samples/s/p 1:19:21 } +2024-07-30 04:50:21,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2883/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 3.0183671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:21,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66091 samples/s/p 1:19:18 } +2024-07-30 04:50:24,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2885/ 3125], loss: 0.169, per_step_time: 1414ms, lr: 3.015196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:24,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.65765 samples/s/p 1:19:18 } +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2887/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 3.012026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66034 samples/s/p 1:19:13 } +2024-07-30 04:50:30,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2889/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 3.008856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:30,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66084 samples/s/p 1:19:09 } +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2891/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 3.0056867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65996 samples/s/p 1:19:07 } +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2893/ 3125], loss: 0.385, per_step_time: 1412ms, lr: 3.0025187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66207 samples/s/p 1:19:03 } +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2895/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.999352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65906 samples/s/p 1:19:02 } +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2897/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 2.9961866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65883 samples/s/p 1:19:00 } +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2899/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 2.9930218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65979 samples/s/p 1:18:56 } +2024-07-30 04:50:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2901/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.9898583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66072 samples/s/p 1:18:52 } +2024-07-30 04:50:50,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2903/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 2.9866949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:50,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65717 samples/s/p 1:18:53 } +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2905/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 2.9835319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66080 samples/s/p 1:18:47 } +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2907/ 3125], loss: 0.115, per_step_time: 1414ms, lr: 2.980371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65556 samples/s/p 1:18:48 } +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2909/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 2.9772114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66028 samples/s/p 1:18:42 } +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2911/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.9740524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65965 samples/s/p 1:18:39 } +2024-07-30 04:51:04,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2913/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.9708945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:04,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65805 samples/s/p 1:18:38 } +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2915/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.9677371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66149 samples/s/p 1:18:32 } +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2917/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 2.9645812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66018 samples/s/p 1:18:30 } +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2919/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 2.961425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65297 samples/s/p 1:18:33 } +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2921/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.958271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:15,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65758 samples/s/p 1:18:27 } +2024-07-30 04:51:18,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2923/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.9551177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:18,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65959 samples/s/p 1:18:22 } +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2925/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9519658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.66234 samples/s/p 1:18:17 } +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2927/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.9488142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66030 samples/s/p 1:18:16 } +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2929/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9456642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66189 samples/s/p 1:18:12 } +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2931/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 2.942515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65961 samples/s/p 1:18:11 } +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2933/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 2.9393668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65928 samples/s/p 1:18:08 } +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2935/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 2.9362188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65902 samples/s/p 1:18:06 } +2024-07-30 04:51:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2937/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 2.9330724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65971 samples/s/p 1:18:02 } +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2939/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 2.9299267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66054 samples/s/p 1:17:59 } +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2941/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 2.9267826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65787 samples/s/p 1:17:58 } +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2943/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.9236394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65914 samples/s/p 1:17:54 } +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2945/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.920497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66158 samples/s/p 1:17:50 } +2024-07-30 04:51:52,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2947/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 2.917356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65725 samples/s/p 1:17:50 } +2024-07-30 04:51:55,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2949/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 2.9142147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:55,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66040 samples/s/p 1:17:45 } +2024-07-30 04:51:58,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2951/ 3125], loss: 0.022, per_step_time: 1413ms, lr: 2.9110752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:58,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66065 samples/s/p 1:17:42 } +2024-07-30 04:52:00,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2953/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 2.9079372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:00,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65717 samples/s/p 1:17:42 } +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2955/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 2.904799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66263 samples/s/p 1:17:35 } +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2957/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.9016626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66070 samples/s/p 1:17:33 } +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2959/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 2.8985273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.65826 samples/s/p 1:17:33 } +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2961/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.8953932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66080 samples/s/p 1:17:28 } +2024-07-30 04:52:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2963/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.8922586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66012 samples/s/p 1:17:25 } +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2965/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.8891266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65998 samples/s/p 1:17:23 } +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2967/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.8859954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65836 samples/s/p 1:17:21 } +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2969/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.882865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65997 samples/s/p 1:17:17 } +2024-07-30 04:52:26,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2971/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 2.8797358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:26,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66001 samples/s/p 1:17:14 } +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2973/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 2.8766076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65604 samples/s/p 1:17:15 } +2024-07-30 04:52:32,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2975/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 2.8734794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:32,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65677 samples/s/p 1:17:11 } +2024-07-30 04:52:34,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2977/ 3125], loss: 0.048, per_step_time: 1415ms, lr: 2.8703535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65344 samples/s/p 1:17:11 } +2024-07-30 04:52:37,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2979/ 3125], loss: 0.607, per_step_time: 1414ms, lr: 2.867227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:37,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65475 samples/s/p 1:17:07 } +2024-07-30 04:52:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2981/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 2.864103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.66164 samples/s/p 1:16:59 } +2024-07-30 04:52:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2983/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 2.86098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:43,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66102 samples/s/p 1:16:56 } +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2985/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 2.857858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66240 samples/s/p 1:16:52 } +2024-07-30 04:52:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2987/ 3125], loss: 0.051, per_step_time: 1413ms, lr: 2.8547367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66106 samples/s/p 1:16:51 } +2024-07-30 04:52:52,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2989/ 3125], loss: 0.155, per_step_time: 1444ms, lr: 2.8516167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:52,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.53976 samples/s/p 1:18:29 } +2024-07-30 04:52:54,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2991/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 2.8484965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:54,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66091 samples/s/p 1:16:45 } +2024-07-30 04:52:57,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2993/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.8453785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.66017 samples/s/p 1:16:43 } +2024-07-30 04:53:00,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2995/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 2.8422617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65194 samples/s/p 1:16:47 } +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2997/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.8391455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65860 samples/s/p 1:16:39 } +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2999/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 2.8360298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:06,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65814 samples/s/p 1:16:36 } +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3001/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 2.832916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65489 samples/s/p 1:16:36 } +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3003/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 2.8298032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:11,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65833 samples/s/p 1:16:30 } +2024-07-30 04:53:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3005/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.8266911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:14,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65884 samples/s/p 1:16:27 } +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3007/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.8235793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65862 samples/s/p 1:16:24 } +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.8204697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.66150 samples/s/p 1:16:19 } +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3011/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.817361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66093 samples/s/p 1:16:17 } +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3013/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.8142535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65931 samples/s/p 1:16:15 } +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3015/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.811147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:28,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66126 samples/s/p 1:16:11 } +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3017/ 3125], loss: 0.380, per_step_time: 1419ms, lr: 2.8080415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:31,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.63726 samples/s/p 1:16:28 } +2024-07-30 04:53:34,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3019/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 2.8049358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65898 samples/s/p 1:16:07 } +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3021/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 2.8018326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65860 samples/s/p 1:16:05 } +2024-07-30 04:53:40,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3023/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 2.798729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:40,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65866 samples/s/p 1:16:02 } +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3025/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.7956276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.66102 samples/s/p 1:15:57 } +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3027/ 3125], loss: 0.122, per_step_time: 1414ms, lr: 2.7925273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65757 samples/s/p 1:15:57 } +2024-07-30 04:53:48,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3029/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 2.7894282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:48,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65862 samples/s/p 1:15:53 } +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3031/ 3125], loss: 0.483, per_step_time: 1414ms, lr: 2.78633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65530 samples/s/p 1:15:53 } +2024-07-30 04:53:54,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3033/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 2.783233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:54,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65982 samples/s/p 1:15:47 } +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3035/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.7801354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65840 samples/s/p 1:15:45 } +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3037/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 2.7770404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65252 samples/s/p 1:15:47 } +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3039/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.7739466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:02,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.66054 samples/s/p 1:15:38 } +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3041/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.7708536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:05,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65983 samples/s/p 1:15:35 } +2024-07-30 04:54:08,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3043/ 3125], loss: 0.102, per_step_time: 1412ms, lr: 2.7677606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:08,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66175 samples/s/p 1:15:31 } +2024-07-30 04:54:11,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3045/ 3125], loss: 0.135, per_step_time: 1412ms, lr: 2.7646702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:11,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66216 samples/s/p 1:15:28 } +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3047/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 2.7615804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65955 samples/s/p 1:15:27 } +2024-07-30 04:54:17,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3049/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 2.7584906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:17,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66303 samples/s/p 1:15:21 } +2024-07-30 04:54:19,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3051/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 2.755403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:19,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65986 samples/s/p 1:15:21 } +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3053/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.7523165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:22,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65977 samples/s/p 1:15:18 } +2024-07-30 04:54:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3055/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.7492315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:25,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65920 samples/s/p 1:15:16 } +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3057/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.746147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65860 samples/s/p 1:15:14 } +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3059/ 3125], loss: 0.276, per_step_time: 1412ms, lr: 2.7430635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.66251 samples/s/p 1:15:08 } +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3061/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.7399817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.65831 samples/s/p 1:15:08 } +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3063/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 2.7368992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65573 samples/s/p 1:15:07 } +2024-07-30 04:54:39,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3065/ 3125], loss: 0.355, per_step_time: 1414ms, lr: 2.7338194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:39,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65434 samples/s/p 1:15:06 } +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3067/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.7307394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65816 samples/s/p 1:15:00 } +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3069/ 3125], loss: 0.339, per_step_time: 1412ms, lr: 2.7276617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66210 samples/s/p 1:14:54 } +2024-07-30 04:54:48,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3071/ 3125], loss: 0.504, per_step_time: 1413ms, lr: 2.7245849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:48,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65823 samples/s/p 1:14:54 } +2024-07-30 04:54:51,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3073/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.7215092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:51,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65985 samples/s/p 1:14:50 } +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3075/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 2.7184346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:53,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66249 samples/s/p 1:14:45 } +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3077/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 2.715361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66000 samples/s/p 1:14:44 } +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3079/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 2.7122876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65375 samples/s/p 1:14:46 } +2024-07-30 04:55:02,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3081/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 2.709216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:02,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66131 samples/s/p 1:14:38 } +2024-07-30 04:55:05,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3083/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.7061462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:05,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65502 samples/s/p 1:14:40 } +2024-07-30 04:55:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3085/ 3125], loss: 0.230, per_step_time: 1412ms, lr: 2.7030771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66187 samples/s/p 1:14:32 } +2024-07-30 04:55:10,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3087/ 3125], loss: 0.280, per_step_time: 1415ms, lr: 2.7000078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65091 samples/s/p 1:14:37 } +2024-07-30 04:55:13,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3089/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6969408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:13,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65926 samples/s/p 1:14:28 } +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3091/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.6938749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:16,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65969 samples/s/p 1:14:25 } +2024-07-30 04:55:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3093/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 2.6908092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65819 samples/s/p 1:14:23 } +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3095/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 2.6877456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66193 samples/s/p 1:14:17 } +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3097/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.684683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66008 samples/s/p 1:14:16 } +2024-07-30 04:55:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3099/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.6816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66115 samples/s/p 1:14:12 } +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3101/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 2.678561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66203 samples/s/p 1:14:09 } +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3103/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.6755022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65774 samples/s/p 1:14:09 } +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3105/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 2.672444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66197 samples/s/p 1:14:03 } +2024-07-30 04:55:39,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3107/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 2.6693863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:39,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65579 samples/s/p 1:14:05 } +2024-07-30 04:55:42,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3109/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 2.6663304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:42,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66310 samples/s/p 1:13:57 } +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3111/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.6632742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66097 samples/s/p 1:13:55 } +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3113/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 2.6602208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65295 samples/s/p 1:13:59 } +2024-07-30 04:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3115/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 2.6571681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65673 samples/s/p 1:13:53 } +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3117/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 2.6541168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65874 samples/s/p 1:13:49 } +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3119/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6510663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65902 samples/s/p 1:13:46 } +2024-07-30 04:55:59,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3121/ 3125], loss: 0.329, per_step_time: 1412ms, lr: 2.648016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:59,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.66253 samples/s/p 1:13:40 } +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3123/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.644968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65777 samples/s/p 1:13:41 } +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3125/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 2.641921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65998 samples/s/p 1:13:36 } +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.6388755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65872 samples/s/p 1:13:35 } +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 4/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 2.6358305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65750 samples/s/p 1:13:33 } +2024-07-30 04:56:13,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 6/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 2.632786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:13,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65770 samples/s/p 1:13:30 } +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 8/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 2.6297437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:16,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.66179 samples/s/p 1:13:24 } +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 10/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6267028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65572 samples/s/p 1:13:26 } +2024-07-30 04:56:21,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 12/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6236612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:21,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65678 samples/s/p 1:13:22 } +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 14/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 2.6206224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65413 samples/s/p 1:13:21 } +2024-07-30 04:56:27,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 16/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 2.6175844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65442 samples/s/p 1:13:18 } +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 18/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 2.6145476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66049 samples/s/p 1:13:11 } +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 20/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.6115122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65896 samples/s/p 1:13:09 } +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 22/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.6084776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65949 samples/s/p 1:13:06 } +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 24/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 2.6054445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65948 samples/s/p 1:13:03 } +2024-07-30 04:56:41,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 26/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 2.6024115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66011 samples/s/p 1:13:00 } +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 28/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 2.5993802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.65995 samples/s/p 1:12:57 } +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 30/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66115 samples/s/p 1:12:53 } +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 32/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.5933205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66020 samples/s/p 1:12:51 } +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 34/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.5902932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66094 samples/s/p 1:12:48 } +2024-07-30 04:56:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 36/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 2.5872669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66220 samples/s/p 1:12:44 } +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 38/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 2.5842417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65999 samples/s/p 1:12:43 } +2024-07-30 04:57:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 40/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 2.581216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:01,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66256 samples/s/p 1:12:38 } +2024-07-30 04:57:04,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 42/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 2.5781935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:04,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65971 samples/s/p 1:12:37 } +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 44/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 2.5751715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66141 samples/s/p 1:12:33 } +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 46/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.5721508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66122 samples/s/p 1:12:31 } +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 48/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.569131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.65725 samples/s/p 1:12:31 } +2024-07-30 04:57:15,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 50/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.5661127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66049 samples/s/p 1:12:25 } +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 52/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 2.5630948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66084 samples/s/p 1:12:22 } +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 54/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.5600777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66084 samples/s/p 1:12:19 } +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 56/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 2.557063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66062 samples/s/p 1:12:17 } +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 58/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.5540494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65959 samples/s/p 1:12:15 } +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 60/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 2.5510367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65939 samples/s/p 1:12:12 } +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 62/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.5480251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65908 samples/s/p 1:12:10 } +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 64/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 2.5450151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66200 samples/s/p 1:12:04 } +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 66/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 2.5420063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65737 samples/s/p 1:12:05 } +2024-07-30 04:57:41,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 68/ 3125], loss: 0.364, per_step_time: 1412ms, lr: 2.5389975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:41,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66185 samples/s/p 1:11:59 } +2024-07-30 04:57:43,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 70/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 2.5359905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66139 samples/s/p 1:11:56 } +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 72/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 2.532985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65643 samples/s/p 1:11:57 } +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 74/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 2.529981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65925 samples/s/p 1:11:52 } +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 76/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 2.5269765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:52,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65801 samples/s/p 1:11:51 } +2024-07-30 04:57:55,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 78/ 3125], loss: 0.093, per_step_time: 1414ms, lr: 2.5239747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:55,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65755 samples/s/p 1:11:48 } +2024-07-30 04:57:58,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 80/ 3125], loss: 0.102, per_step_time: 1412ms, lr: 2.5209742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:58,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.66179 samples/s/p 1:11:42 } +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 82/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 2.5179743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65418 samples/s/p 1:11:45 } +2024-07-30 04:58:03,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 84/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 2.514975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:03,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66307 samples/s/p 1:11:35 } +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 86/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.5119778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66169 samples/s/p 1:11:34 } +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 88/ 3125], loss: 0.132, per_step_time: 1414ms, lr: 2.5089817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65537 samples/s/p 1:11:36 } +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 90/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 2.505987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:12,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65436 samples/s/p 1:11:34 } +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 92/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 2.5029933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66168 samples/s/p 1:11:25 } +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 94/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 2.5000008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65829 samples/s/p 1:11:25 } +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 96/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 2.4970086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65515 samples/s/p 1:11:24 } +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 98/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 2.4940175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66113 samples/s/p 1:11:17 } +2024-07-30 04:58:26,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 100/ 3125], loss: 0.347, per_step_time: 1412ms, lr: 2.4910285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:26,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66216 samples/s/p 1:11:13 } +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 102/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.4880408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66070 samples/s/p 1:11:12 } +2024-07-30 04:58:32,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 104/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 2.4850544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:32,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65597 samples/s/p 1:11:13 } +2024-07-30 04:58:35,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 106/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.4820695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:35,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65795 samples/s/p 1:11:08 } +2024-07-30 04:58:37,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 108/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4790852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:37,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65903 samples/s/p 1:11:05 } +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 110/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4761023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66098 samples/s/p 1:11:00 } +2024-07-30 04:58:43,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 112/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 2.4731198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:43,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65742 samples/s/p 1:11:00 } +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 114/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.4701392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65998 samples/s/p 1:10:55 } +2024-07-30 04:58:49,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 116/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 2.46716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:49,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66074 samples/s/p 1:10:52 } +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 118/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.464182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66004 samples/s/p 1:10:50 } +2024-07-30 04:58:54,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 120/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 2.461204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:54,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66114 samples/s/p 1:10:46 } +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 122/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 2.4582287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.66055 samples/s/p 1:10:44 } +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 124/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.4552542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.65932 samples/s/p 1:10:42 } +2024-07-30 04:59:03,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 126/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.45228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:03,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.65860 samples/s/p 1:10:39 } +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 128/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 2.4493079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.65813 samples/s/p 1:10:37 } +2024-07-30 04:59:09,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 130/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.4463372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:09,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66064 samples/s/p 1:10:32 } +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 132/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.4433677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66053 samples/s/p 1:10:29 } +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 134/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4403994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65922 samples/s/p 1:10:28 } +2024-07-30 04:59:17,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 136/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 2.4374324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:17,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66192 samples/s/p 1:10:23 } +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 138/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.4344665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65849 samples/s/p 1:10:23 } +2024-07-30 04:59:23,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 140/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 2.431501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:23,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65603 samples/s/p 1:10:22 } +2024-07-30 04:59:26,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 142/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 2.4285375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:26,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66108 samples/s/p 1:10:15 } +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 144/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.4255744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66138 samples/s/p 1:10:12 } +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 146/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.422613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66051 samples/s/p 1:10:10 } +2024-07-30 04:59:34,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 148/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.4196536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:34,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65480 samples/s/p 1:10:11 } +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 150/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.416695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65827 samples/s/p 1:10:06 } +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 152/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.413738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66130 samples/s/p 1:10:01 } +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 154/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 2.410782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65799 samples/s/p 1:10:00 } +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 156/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 2.407826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66092 samples/s/p 1:09:55 } +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 158/ 3125], loss: 0.271, per_step_time: 1419ms, lr: 2.4048725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.63651 samples/s/p 1:10:11 } +2024-07-30 04:59:51,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 160/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.4019203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:51,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66086 samples/s/p 1:09:50 } +2024-07-30 04:59:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 162/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3989692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65905 samples/s/p 1:09:48 } +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 164/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.396018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66112 samples/s/p 1:09:44 } +2024-07-30 05:00:00,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 166/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.3930697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:00,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65821 samples/s/p 1:09:43 } +2024-07-30 05:00:02,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 168/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.3901223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:02,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65780 samples/s/p 1:09:41 } +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 170/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 2.3871753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66109 samples/s/p 1:09:35 } +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 172/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.3842304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66116 samples/s/p 1:09:32 } +2024-07-30 05:00:11,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 174/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.3812868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:11,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66016 samples/s/p 1:09:30 } +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 176/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.3783446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65872 samples/s/p 1:09:29 } +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 178/ 3125], loss: 0.348, per_step_time: 1414ms, lr: 2.3754033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65678 samples/s/p 1:09:27 } +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 180/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.3724635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65787 samples/s/p 1:09:24 } +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 182/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 2.369525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65716 samples/s/p 1:09:21 } +2024-07-30 05:00:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 184/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 2.3665866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65672 samples/s/p 1:09:19 } +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 186/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 2.3636508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65704 samples/s/p 1:09:16 } +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 188/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.360715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66099 samples/s/p 1:09:10 } +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 190/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 2.357781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66145 samples/s/p 1:09:07 } +2024-07-30 05:00:36,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 192/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.354849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:36,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66057 samples/s/p 1:09:05 } +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 194/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 2.3519178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65837 samples/s/p 1:09:03 } +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 196/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 2.348988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66081 samples/s/p 1:08:59 } +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 198/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.3460586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66148 samples/s/p 1:08:56 } +2024-07-30 05:00:48,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 200/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.3431312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:48,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66074 samples/s/p 1:08:53 } +2024-07-30 05:00:51,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 202/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 2.3402056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:51,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65917 samples/s/p 1:08:52 } +2024-07-30 05:00:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 204/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 2.3372806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:53,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65975 samples/s/p 1:08:48 } +2024-07-30 05:00:56,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 206/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 2.3343575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:56,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66103 samples/s/p 1:08:45 } +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 208/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.3314344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66116 samples/s/p 1:08:42 } +2024-07-30 05:01:02,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 210/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.3285136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:02,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66140 samples/s/p 1:08:39 } +2024-07-30 05:01:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 212/ 3125], loss: 0.287, per_step_time: 1418ms, lr: 2.3255939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.63966 samples/s/p 1:08:52 } +2024-07-30 05:01:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 214/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 2.3226744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:08,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.65946 samples/s/p 1:08:34 } +2024-07-30 05:01:10,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 216/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 2.3197572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:10,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65396 samples/s/p 1:08:36 } +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 218/ 3125], loss: 0.399, per_step_time: 1416ms, lr: 2.3168413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.64629 samples/s/p 1:08:38 } +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 220/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 2.313927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65948 samples/s/p 1:08:26 } +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 222/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.311014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65921 samples/s/p 1:08:23 } +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 224/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.3081018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66156 samples/s/p 1:08:19 } +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 226/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.3051914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66108 samples/s/p 1:08:16 } +2024-07-30 05:01:27,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 228/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3022812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66119 samples/s/p 1:08:13 } +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 230/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.2993727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66033 samples/s/p 1:08:11 } +2024-07-30 05:01:33,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 232/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.2964653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:33,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66135 samples/s/p 1:08:08 } +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 234/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.2935599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:36,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65570 samples/s/p 1:08:09 } +2024-07-30 05:01:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 236/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 2.2906556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66072 samples/s/p 1:08:02 } +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 238/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.287753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65864 samples/s/p 1:08:01 } +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 240/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.284851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66134 samples/s/p 1:07:56 } +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 242/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 2.2819497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:47,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65469 samples/s/p 1:07:58 } +2024-07-30 05:01:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 244/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 2.279051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65716 samples/s/p 1:07:54 } +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 246/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 2.2761533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66058 samples/s/p 1:07:48 } +2024-07-30 05:01:56,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 248/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 2.2732568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:56,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65576 samples/s/p 1:07:49 } +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 250/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.2703616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66029 samples/s/p 1:07:43 } +2024-07-30 05:02:01,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 252/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 2.2674667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:01,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66028 samples/s/p 1:07:40 } +2024-07-30 05:02:04,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 254/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 2.2645745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:04,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65931 samples/s/p 1:07:38 } +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 256/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.261682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66060 samples/s/p 1:07:34 } +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 258/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.2587922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65970 samples/s/p 1:07:32 } +2024-07-30 05:02:13,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 260/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2559038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:13,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66150 samples/s/p 1:07:28 } +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 262/ 3125], loss: 0.442, per_step_time: 1415ms, lr: 2.2530164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65324 samples/s/p 1:07:31 } +2024-07-30 05:02:18,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 264/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.2501304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:18,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65853 samples/s/p 1:07:24 } +2024-07-30 05:02:21,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 266/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.247246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66060 samples/s/p 1:07:20 } +2024-07-30 05:02:24,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 268/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 2.2443626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65726 samples/s/p 1:07:20 } +2024-07-30 05:02:27,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 270/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.2414795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:27,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65984 samples/s/p 1:07:15 } +2024-07-30 05:02:30,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 272/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 2.2385987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:30,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.65969 samples/s/p 1:07:12 } +2024-07-30 05:02:33,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 274/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.2357194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:33,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66099 samples/s/p 1:07:08 } +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 276/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.2328406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66102 samples/s/p 1:07:06 } +2024-07-30 05:02:38,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 278/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 2.2299637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:38,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.65944 samples/s/p 1:07:04 } +2024-07-30 05:02:41,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 280/ 3125], loss: 0.103, per_step_time: 1412ms, lr: 2.2270885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66349 samples/s/p 1:06:58 } +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 282/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 2.2242143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:44,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.65818 samples/s/p 1:06:59 } +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 284/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 2.2213417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66034 samples/s/p 1:06:55 } +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 286/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.218469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:50,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66004 samples/s/p 1:06:52 } +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 288/ 3125], loss: 0.184, per_step_time: 1412ms, lr: 2.2155987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:52,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66173 samples/s/p 1:06:48 } +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 290/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 2.21273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65400 samples/s/p 1:06:51 } +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 292/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 2.2098627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65645 samples/s/p 1:06:46 } +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 294/ 3125], loss: 0.413, per_step_time: 1412ms, lr: 2.2069967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66239 samples/s/p 1:06:39 } +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 296/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 2.2041309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66306 samples/s/p 1:06:36 } +2024-07-30 05:03:07,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 298/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.2012675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:07,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65850 samples/s/p 1:06:36 } +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 300/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.1984042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66237 samples/s/p 1:06:31 } +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 302/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.1955436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:12,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66063 samples/s/p 1:06:29 } +2024-07-30 05:03:15,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 304/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.192684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.65955 samples/s/p 1:06:27 } +2024-07-30 05:03:18,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 306/ 3125], loss: 0.305, per_step_time: 1416ms, lr: 2.189826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:18,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.64767 samples/s/p 1:06:33 } +2024-07-30 05:03:21,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 308/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.1869691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:21,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66110 samples/s/p 1:06:20 } +2024-07-30 05:03:24,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 310/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 2.1841138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:24,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66131 samples/s/p 1:06:17 } +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 312/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 2.18126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.65726 samples/s/p 1:06:17 } +2024-07-30 05:03:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 314/ 3125], loss: 0.510, per_step_time: 1414ms, lr: 2.178406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:29,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65609 samples/s/p 1:06:15 } +2024-07-30 05:03:32,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 316/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 2.175555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:32,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65758 samples/s/p 1:06:12 } +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 318/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 2.1727046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66016 samples/s/p 1:06:07 } +2024-07-30 05:03:38,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 320/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 2.1698552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:38,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66254 samples/s/p 1:06:02 } +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 322/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 2.1670078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65555 samples/s/p 1:06:04 } +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 324/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 2.1641617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65940 samples/s/p 1:05:59 } +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 326/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.161317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65977 samples/s/p 1:05:56 } +2024-07-30 05:03:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 328/ 3125], loss: 0.163, per_step_time: 1412ms, lr: 2.158473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:49,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66172 samples/s/p 1:05:52 } +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 330/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 2.1556311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66368 samples/s/p 1:05:47 } +2024-07-30 05:03:55,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 332/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.1527903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:55,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66101 samples/s/p 1:05:46 } +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 334/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.1499513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.65990 samples/s/p 1:05:44 } +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 336/ 3125], loss: 0.485, per_step_time: 1413ms, lr: 2.1471137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66102 samples/s/p 1:05:41 } +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 338/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 2.144277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65823 samples/s/p 1:05:40 } +2024-07-30 05:04:06,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 340/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 2.141441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:06,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65943 samples/s/p 1:05:36 } +2024-07-30 05:04:09,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 342/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.1386072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:09,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66170 samples/s/p 1:05:32 } +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 344/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.135774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65881 samples/s/p 1:05:31 } +2024-07-30 05:04:15,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 346/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 2.1329429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:15,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65602 samples/s/p 1:05:30 } +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 348/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 2.1301134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65651 samples/s/p 1:05:27 } +2024-07-30 05:04:20,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 350/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.127285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:20,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65783 samples/s/p 1:05:23 } +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 352/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.1244582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66138 samples/s/p 1:05:18 } +2024-07-30 05:04:26,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 354/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 2.1216326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:26,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66003 samples/s/p 1:05:16 } +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 356/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 2.1188087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66045 samples/s/p 1:05:13 } +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 358/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 2.115985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65987 samples/s/p 1:05:11 } +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 360/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.1131634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65853 samples/s/p 1:05:09 } +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 362/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 2.1103435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65894 samples/s/p 1:05:06 } +2024-07-30 05:04:40,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 364/ 3125], loss: 0.402, per_step_time: 1425ms, lr: 2.1075239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.61082 samples/s/p 1:05:36 } +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 366/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 2.1047065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66261 samples/s/p 1:04:57 } +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 368/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.1018907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66044 samples/s/p 1:04:56 } +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 370/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.0990763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66050 samples/s/p 1:04:53 } +2024-07-30 05:04:51,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 372/ 3125], loss: 0.299, per_step_time: 1412ms, lr: 2.0962623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:51,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66240 samples/s/p 1:04:49 } +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 374/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.0934503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65981 samples/s/p 1:04:48 } +2024-07-30 05:04:57,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 376/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 2.09064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66045 samples/s/p 1:04:45 } +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 378/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 2.087831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66018 samples/s/p 1:04:42 } +2024-07-30 05:05:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 380/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 2.0850239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:03,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65828 samples/s/p 1:04:41 } +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 382/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 2.0822176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65911 samples/s/p 1:04:37 } +2024-07-30 05:05:08,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 384/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.079413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.66039 samples/s/p 1:04:33 } +2024-07-30 05:05:11,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 386/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 2.076608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65749 samples/s/p 1:04:33 } +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 388/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 2.0738055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65764 samples/s/p 1:04:30 } +2024-07-30 05:05:17,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 390/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.0710047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.66060 samples/s/p 1:04:25 } +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 392/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 2.0682057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:20,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65551 samples/s/p 1:04:25 } +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 394/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 2.065408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65009 samples/s/p 1:04:26 } +2024-07-30 05:05:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 396/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 2.0626114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65786 samples/s/p 1:04:18 } +2024-07-30 05:05:28,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 398/ 3125], loss: 0.328, per_step_time: 1414ms, lr: 2.0598168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:28,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65704 samples/s/p 1:04:16 } +2024-07-30 05:05:31,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 400/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.0570221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:31,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.66048 samples/s/p 1:04:11 } +2024-07-30 05:05:34,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 402/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.05423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:34,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66110 samples/s/p 1:04:08 } +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 404/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 2.051439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66253 samples/s/p 1:04:04 } +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 406/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.0486498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66161 samples/s/p 1:04:02 } +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 408/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 2.0458617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66149 samples/s/p 1:03:59 } +2024-07-30 05:05:45,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 410/ 3125], loss: 0.260, per_step_time: 1412ms, lr: 2.0430743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66205 samples/s/p 1:03:56 } +2024-07-30 05:05:48,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 412/ 3125], loss: 0.390, per_step_time: 1414ms, lr: 2.0402892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:48,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65439 samples/s/p 1:03:58 } +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 414/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 2.0375046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66033 samples/s/p 1:03:51 } +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 416/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 2.0347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66178 samples/s/p 1:03:47 } +2024-07-30 05:05:57,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 418/ 3125], loss: 0.521, per_step_time: 1414ms, lr: 2.0319414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:57,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65755 samples/s/p 1:03:47 } +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 420/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.029162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66091 samples/s/p 1:03:42 } +2024-07-30 05:06:02,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 422/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.0263842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:02,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.66007 samples/s/p 1:03:40 } +2024-07-30 05:06:05,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 424/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.023607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:05,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65844 samples/s/p 1:03:38 } +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 426/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 2.0208322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.66032 samples/s/p 1:03:34 } +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 428/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 2.0180582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65883 samples/s/p 1:03:32 } +2024-07-30 05:06:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 430/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 2.0152852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65637 samples/s/p 1:03:31 } +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 432/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 2.0125142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65252 samples/s/p 1:03:31 } +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 434/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.0097436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:19,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66054 samples/s/p 1:03:23 } +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 436/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.0069756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66250 samples/s/p 1:03:19 } +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 438/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.0042091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66097 samples/s/p 1:03:17 } +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 440/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 2.0014438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65757 samples/s/p 1:03:16 } +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 442/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.9986799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65535 samples/s/p 1:03:15 } +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 444/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 1.9959166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65752 samples/s/p 1:03:11 } +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 446/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 1.9931558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65978 samples/s/p 1:03:06 } +2024-07-30 05:06:39,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 448/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.9903964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:39,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65973 samples/s/p 1:03:03 } +2024-07-30 05:06:42,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 450/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.9876384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:42,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66116 samples/s/p 1:03:00 } +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 452/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 1.9848817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66249 samples/s/p 1:02:56 } +2024-07-30 05:06:48,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 454/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 1.9821257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:48,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66015 samples/s/p 1:02:55 } +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 456/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.9793717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66068 samples/s/p 1:02:51 } +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 458/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.9766185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65887 samples/s/p 1:02:50 } +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 460/ 3125], loss: 0.338, per_step_time: 1415ms, lr: 1.9738677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65193 samples/s/p 1:02:52 } +2024-07-30 05:06:59,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 462/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 1.9711183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:59,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65754 samples/s/p 1:02:45 } +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 464/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1.9683703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65948 samples/s/p 1:02:41 } +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 466/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 1.965624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65796 samples/s/p 1:02:39 } +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 468/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.962879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65926 samples/s/p 1:02:35 } +2024-07-30 05:07:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 470/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.9601353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:10,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65867 samples/s/p 1:02:33 } +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 472/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 1.9573924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65793 samples/s/p 1:02:31 } +2024-07-30 05:07:16,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 474/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.9546515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:16,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66085 samples/s/p 1:02:26 } +2024-07-30 05:07:19,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 476/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.9519123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:19,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66125 samples/s/p 1:02:23 } +2024-07-30 05:07:22,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 478/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 1.9491736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:22,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66282 samples/s/p 1:02:19 } +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 480/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 1.9464371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66264 samples/s/p 1:02:16 } +2024-07-30 05:07:27,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 482/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 1.9437023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.65973 samples/s/p 1:02:15 } +2024-07-30 05:07:30,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 484/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.9409688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66082 samples/s/p 1:02:12 } +2024-07-30 05:07:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 486/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 1.938237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66120 samples/s/p 1:02:09 } +2024-07-30 05:07:36,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 488/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 1.9355055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:36,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65990 samples/s/p 1:02:07 } +2024-07-30 05:07:39,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 490/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.9327765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66090 samples/s/p 1:02:03 } +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 492/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.930049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66111 samples/s/p 1:02:00 } +2024-07-30 05:07:44,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 494/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 1.9273227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65759 samples/s/p 1:02:00 } +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 496/ 3125], loss: 0.438, per_step_time: 1413ms, lr: 1.924598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.66047 samples/s/p 1:01:55 } +2024-07-30 05:07:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 498/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.9218742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:50,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65830 samples/s/p 1:01:54 } +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 500/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 1.9191523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.66027 samples/s/p 1:01:50 } +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 502/ 3125], loss: 0.083, per_step_time: 1414ms, lr: 1.916431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65454 samples/s/p 1:01:50 } +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 504/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.9137126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:59,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65698 samples/s/p 1:01:46 } +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 506/ 3125], loss: 0.513, per_step_time: 1414ms, lr: 1.9109953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:01,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65758 samples/s/p 1:01:43 } +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 508/ 3125], loss: 0.122, per_step_time: 1418ms, lr: 1.9082795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.63883 samples/s/p 1:01:52 } +2024-07-30 05:08:07,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 510/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 1.9055652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:07,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66004 samples/s/p 1:01:36 } +2024-07-30 05:08:10,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 512/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9028523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:10,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65946 samples/s/p 1:01:33 } +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 514/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.9001409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66081 samples/s/p 1:01:29 } +2024-07-30 05:08:16,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 516/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.89743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65977 samples/s/p 1:01:27 } +2024-07-30 05:08:18,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 518/ 3125], loss: 0.083, per_step_time: 1414ms, lr: 1.8947217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:18,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65757 samples/s/p 1:01:26 } +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 520/ 3125], loss: 0.139, per_step_time: 1415ms, lr: 1.8920147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65004 samples/s/p 1:01:28 } +2024-07-30 05:08:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 522/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 1.8893084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:24,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65651 samples/s/p 1:01:21 } +2024-07-30 05:08:27,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 524/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 1.8866044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:27,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66002 samples/s/p 1:01:16 } +2024-07-30 05:08:30,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 526/ 3125], loss: 0.138, per_step_time: 1414ms, lr: 1.8839019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:30,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65712 samples/s/p 1:01:15 } +2024-07-30 05:08:33,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 528/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 1.8812009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65927 samples/s/p 1:01:11 } +2024-07-30 05:08:35,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 530/ 3125], loss: 0.005, per_step_time: 1412ms, lr: 1.8785005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:35,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66307 samples/s/p 1:01:05 } +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 532/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 1.8758026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65824 samples/s/p 1:01:06 } +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 534/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.873106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66126 samples/s/p 1:01:01 } +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 536/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 1.870411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65977 samples/s/p 1:00:59 } +2024-07-30 05:08:47,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 538/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 1.8677174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:47,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65961 samples/s/p 1:00:56 } +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 540/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 1.8650254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65514 samples/s/p 1:00:56 } +2024-07-30 05:08:52,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 542/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.862334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:52,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66007 samples/s/p 1:00:50 } +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 544/ 3125], loss: 0.156, per_step_time: 1412ms, lr: 1.859645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66212 samples/s/p 1:00:46 } +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 546/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 1.8569565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66136 samples/s/p 1:00:44 } +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 548/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 1.8542704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66123 samples/s/p 1:00:41 } +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 550/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 1.8515858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66100 samples/s/p 1:00:38 } +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 552/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 1.8489027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66132 samples/s/p 1:00:35 } +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 554/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 1.8462214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66007 samples/s/p 1:00:33 } +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 556/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 1.8435412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66084 samples/s/p 1:00:30 } +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 558/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.8408629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65906 samples/s/p 1:00:28 } +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 560/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 1.8381849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65755 samples/s/p 1:00:27 } +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 562/ 3125], loss: 0.268, per_step_time: 1417ms, lr: 1.8355095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.64539 samples/s/p 1:00:31 } +2024-07-30 05:09:24,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 564/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 1.8328357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:24,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65984 samples/s/p 1:00:19 } +2024-07-30 05:09:26,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 566/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.8301621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:26,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66117 samples/s/p 1:00:16 } +2024-07-30 05:09:29,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 568/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 1.8274911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:29,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65959 samples/s/p 1:00:14 } +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 570/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.8248218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:32,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66156 samples/s/p 1:00:10 } +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 572/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.8221535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65781 samples/s/p 1:00:09 } +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 574/ 3125], loss: 0.064, per_step_time: 1414ms, lr: 1.8194863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:38,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65751 samples/s/p 1:00:07 } +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 576/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.8168216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65794 samples/s/p 1:00:04 } +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 578/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 1.8141582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:43,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65317 samples/s/p 1:00:04 } +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 580/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.8114963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:46,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66051 samples/s/p 0:59:56 } +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 582/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.8088361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66083 samples/s/p 0:59:53 } +2024-07-30 05:09:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 584/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.8061771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66071 samples/s/p 0:59:51 } +2024-07-30 05:09:55,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 586/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 1.8035188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:55,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65568 samples/s/p 0:59:51 } +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 588/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.8008631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66065 samples/s/p 0:59:45 } +2024-07-30 05:10:00,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 590/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.798208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:00,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65227 samples/s/p 0:59:47 } +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 592/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 1.7955554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65957 samples/s/p 0:59:40 } +2024-07-30 05:10:06,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 594/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.7929044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66125 samples/s/p 0:59:36 } +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 596/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 1.7902544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:09,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66190 samples/s/p 0:59:33 } +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 598/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 1.7876064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66085 samples/s/p 0:59:31 } +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 600/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 1.7849596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.66148 samples/s/p 0:59:27 } +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 602/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 1.7823138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65624 samples/s/p 0:59:28 } +2024-07-30 05:10:20,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 604/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 1.7796704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:20,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65960 samples/s/p 0:59:23 } +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 606/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 1.7770287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65895 samples/s/p 0:59:21 } +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 608/ 3125], loss: 0.591, per_step_time: 1413ms, lr: 1.7743882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65948 samples/s/p 0:59:17 } +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 610/ 3125], loss: 0.108, per_step_time: 1414ms, lr: 1.771748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:29,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65672 samples/s/p 0:59:16 } +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 612/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 1.7691108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65274 samples/s/p 0:59:16 } +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 614/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 1.7664751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.66082 samples/s/p 0:59:08 } +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 616/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 1.7638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65749 samples/s/p 0:59:07 } +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 618/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.7612073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.65735 samples/s/p 0:59:05 } +2024-07-30 05:10:43,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 620/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 1.758576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:43,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66263 samples/s/p 0:58:58 } +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 622/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 1.7559465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66183 samples/s/p 0:58:56 } +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 624/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 1.7533185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66018 samples/s/p 0:58:54 } +2024-07-30 05:10:51,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 626/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 1.750692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:51,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66007 samples/s/p 0:58:52 } +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 628/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.7480671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.66046 samples/s/p 0:58:49 } +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 630/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.7454427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65897 samples/s/p 0:58:47 } +2024-07-30 05:11:00,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 632/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 1.7428207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:00,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65257 samples/s/p 0:58:48 } +2024-07-30 05:11:03,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 634/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 1.7401995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:03,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65112 samples/s/p 0:58:46 } +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 636/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.7375809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66195 samples/s/p 0:58:36 } +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 638/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.7349636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.65933 samples/s/p 0:58:35 } +2024-07-30 05:11:11,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 640/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 1.7323479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:11,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66044 samples/s/p 0:58:32 } +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 642/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.7297339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66068 samples/s/p 0:58:29 } +2024-07-30 05:11:17,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 644/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 1.7271215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:17,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66006 samples/s/p 0:58:26 } +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 646/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.7245095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66120 samples/s/p 0:58:23 } +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 648/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 1.7219004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66019 samples/s/p 0:58:20 } +2024-07-30 05:11:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 650/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7192924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:25,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65879 samples/s/p 0:58:18 } +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 652/ 3125], loss: 0.326, per_step_time: 1414ms, lr: 1.7166861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65445 samples/s/p 0:58:18 } +2024-07-30 05:11:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 654/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.7140806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66037 samples/s/p 0:58:12 } +2024-07-30 05:11:34,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 656/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7114774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:34,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66085 samples/s/p 0:58:09 } +2024-07-30 05:11:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 658/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7088759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65938 samples/s/p 0:58:07 } +2024-07-30 05:11:40,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 660/ 3125], loss: 0.120, per_step_time: 1412ms, lr: 1.706275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:40,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66190 samples/s/p 0:58:02 } +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 662/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7036765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65977 samples/s/p 0:58:01 } +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 664/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7010799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65921 samples/s/p 0:57:58 } +2024-07-30 05:11:48,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 666/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6984844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:48,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65800 samples/s/p 0:57:56 } +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 668/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.695891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.66086 samples/s/p 0:57:52 } +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 670/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 1.6932988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65701 samples/s/p 0:57:51 } +2024-07-30 05:11:57,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 672/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 1.690708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:57,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65025 samples/s/p 0:57:53 } +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 674/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 1.6881182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65961 samples/s/p 0:57:44 } +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 676/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.6855311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65774 samples/s/p 0:57:42 } +2024-07-30 05:12:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 678/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6829442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:05,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66041 samples/s/p 0:57:38 } +2024-07-30 05:12:08,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 680/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 1.6803601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:08,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66220 samples/s/p 0:57:34 } +2024-07-30 05:12:11,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 682/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 1.6777774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:11,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65714 samples/s/p 0:57:34 } +2024-07-30 05:12:14,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 684/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 1.6751966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:14,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66131 samples/s/p 0:57:29 } +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 686/ 3125], loss: 0.592, per_step_time: 1413ms, lr: 1.6726168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66021 samples/s/p 0:57:27 } +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 688/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 1.670038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.66104 samples/s/p 0:57:23 } +2024-07-30 05:12:22,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 690/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.6674619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:22,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65620 samples/s/p 0:57:24 } +2024-07-30 05:12:25,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 692/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.6648873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65949 samples/s/p 0:57:19 } +2024-07-30 05:12:28,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 694/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 1.6623145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66126 samples/s/p 0:57:15 } +2024-07-30 05:12:31,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 696/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6597429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66155 samples/s/p 0:57:12 } +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 698/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.657173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66076 samples/s/p 0:57:09 } +2024-07-30 05:12:36,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 700/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6546037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:36,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66143 samples/s/p 0:57:06 } +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 702/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.6520369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65835 samples/s/p 0:57:05 } +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 704/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.6494708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65867 samples/s/p 0:57:02 } +2024-07-30 05:12:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 706/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 1.6469075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65805 samples/s/p 0:57:00 } +2024-07-30 05:12:48,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 708/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.6443457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:48,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65767 samples/s/p 0:56:57 } +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 1.6417855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65828 samples/s/p 0:56:54 } +2024-07-30 05:12:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 712/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 1.6392266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65848 samples/s/p 0:56:51 } +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 714/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.6366696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66052 samples/s/p 0:56:47 } +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 716/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 1.6341144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65715 samples/s/p 0:56:46 } +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 718/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 1.6315594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66111 samples/s/p 0:56:41 } +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 720/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.6290071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65971 samples/s/p 0:56:39 } +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 722/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 1.6264567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65991 samples/s/p 0:56:36 } +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 724/ 3125], loss: 0.184, per_step_time: 1414ms, lr: 1.6239064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65715 samples/s/p 0:56:35 } +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 726/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 1.6213589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65727 samples/s/p 0:56:32 } +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 728/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 1.6188135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65728 samples/s/p 0:56:29 } +2024-07-30 05:13:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 730/ 3125], loss: 0.191, per_step_time: 1412ms, lr: 1.6162691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:19,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66256 samples/s/p 0:56:23 } +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 732/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 1.6137257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66024 samples/s/p 0:56:22 } +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 734/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6111848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65782 samples/s/p 0:56:20 } +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 736/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.6086453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65905 samples/s/p 0:56:17 } +2024-07-30 05:13:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 738/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.6061076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:30,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65610 samples/s/p 0:56:16 } +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 740/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 1.6035715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65860 samples/s/p 0:56:11 } +2024-07-30 05:13:36,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 742/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.6010371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65984 samples/s/p 0:56:08 } +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 744/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 1.5985032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66101 samples/s/p 0:56:04 } +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 746/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 1.5959721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:42,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66075 samples/s/p 0:56:02 } +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 748/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.5934413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66021 samples/s/p 0:55:59 } +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 750/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.5909135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65934 samples/s/p 0:55:57 } +2024-07-30 05:13:47,670 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:14:24,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 752/ 3125], loss: 0.167, per_step_time: 1417ms, lr: 1.5883871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:24,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.64290 samples/s/p 0:56:04 } +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 754/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 1.5858626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:26,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65876 samples/s/p 0:55:51 } +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 756/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.5833392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.66064 samples/s/p 0:55:48 } +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 758/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.5808176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65674 samples/s/p 0:55:47 } +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 760/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 1.5782979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:35,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65178 samples/s/p 0:55:47 } +2024-07-30 05:14:38,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 762/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 1.5757787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:38,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65449 samples/s/p 0:55:43 } +2024-07-30 05:14:41,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 764/ 3125], loss: 0.270, per_step_time: 1412ms, lr: 1.5732625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:41,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66184 samples/s/p 0:55:36 } +2024-07-30 05:14:44,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 766/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.5707475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:44,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66044 samples/s/p 0:55:34 } +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 768/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 1.5682333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:47,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66032 samples/s/p 0:55:31 } +2024-07-30 05:14:50,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 770/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.5657216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:50,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66109 samples/s/p 0:55:27 } +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 772/ 3125], loss: 0.538, per_step_time: 1413ms, lr: 1.5632113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:53,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66076 samples/s/p 0:55:25 } +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 774/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.5607031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66113 samples/s/p 0:55:22 } +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 776/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.5581957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66193 samples/s/p 0:55:19 } +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 778/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5556905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65922 samples/s/p 0:55:17 } +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 780/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.5531871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66104 samples/s/p 0:55:13 } +2024-07-30 05:15:07,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 782/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.5506852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:07,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65998 samples/s/p 0:55:11 } +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 784/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.548185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66053 samples/s/p 0:55:08 } +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 786/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 1.5456867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65909 samples/s/p 0:55:06 } +2024-07-30 05:15:16,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 788/ 3125], loss: 0.313, per_step_time: 1414ms, lr: 1.543189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:16,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65660 samples/s/p 0:55:05 } +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 790/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 1.5406936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65440 samples/s/p 0:55:03 } +2024-07-30 05:15:22,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 792/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5381992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65885 samples/s/p 0:54:58 } +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 794/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.5357074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65915 samples/s/p 0:54:55 } +2024-07-30 05:15:27,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 796/ 3125], loss: 0.059, per_step_time: 1414ms, lr: 1.5332171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65432 samples/s/p 0:54:55 } +2024-07-30 05:15:30,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 798/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 1.5307284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:30,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65374 samples/s/p 0:54:52 } +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 800/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 1.5282416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65794 samples/s/p 0:54:47 } +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 802/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 1.525756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65810 samples/s/p 0:54:44 } +2024-07-30 05:15:39,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 804/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.5232717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:39,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.66133 samples/s/p 0:54:39 } +2024-07-30 05:15:42,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 806/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.5207895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:42,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65850 samples/s/p 0:54:38 } +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 808/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 1.5183094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:44,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66005 samples/s/p 0:54:34 } +2024-07-30 05:15:47,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 810/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 1.5158307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:47,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65979 samples/s/p 0:54:32 } +2024-07-30 05:15:50,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 812/ 3125], loss: 0.385, per_step_time: 1412ms, lr: 1.5133529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66181 samples/s/p 0:54:28 } +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 814/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.5108776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65649 samples/s/p 0:54:28 } +2024-07-30 05:15:56,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 816/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 1.508404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:56,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66026 samples/s/p 0:54:23 } +2024-07-30 05:15:59,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 818/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 1.5059313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:59,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65131 samples/s/p 0:54:25 } +2024-07-30 05:16:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 820/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.5034607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:01,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66140 samples/s/p 0:54:17 } +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 822/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 1.5009921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65079 samples/s/p 0:54:20 } +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 824/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 1.4985251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.66154 samples/s/p 0:54:11 } +2024-07-30 05:16:10,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 826/ 3125], loss: 0.120, per_step_time: 1415ms, lr: 1.4960599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:10,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65000 samples/s/p 0:54:15 } +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 828/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 1.4935964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65387 samples/s/p 0:54:10 } +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 830/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 1.4911344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:16,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65501 samples/s/p 0:54:06 } +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 832/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 1.4886731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65483 samples/s/p 0:54:03 } +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 834/ 3125], loss: 0.438, per_step_time: 1412ms, lr: 1.4862144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66341 samples/s/p 0:53:56 } +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 836/ 3125], loss: 0.238, per_step_time: 1412ms, lr: 1.4837568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66301 samples/s/p 0:53:53 } +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 838/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.4813014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66125 samples/s/p 0:53:51 } +2024-07-30 05:16:30,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 840/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.4788482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65881 samples/s/p 0:53:50 } +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 842/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 1.4763963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65895 samples/s/p 0:53:47 } +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 844/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.473946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65917 samples/s/p 0:53:44 } +2024-07-30 05:16:38,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 846/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.4714974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:38,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66035 samples/s/p 0:53:40 } +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 848/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 1.4690497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66113 samples/s/p 0:53:37 } +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 850/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 1.4666044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65973 samples/s/p 0:53:35 } +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 852/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4641612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66114 samples/s/p 0:53:32 } +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 854/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.4617192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65959 samples/s/p 0:53:30 } +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.4592785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66008 samples/s/p 0:53:27 } +2024-07-30 05:16:55,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 858/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 1.45684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:55,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65616 samples/s/p 0:53:26 } +2024-07-30 05:16:58,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 860/ 3125], loss: 0.421, per_step_time: 1415ms, lr: 1.4544033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:58,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65183 samples/s/p 0:53:26 } +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 862/ 3125], loss: 0.449, per_step_time: 1414ms, lr: 1.4519674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:01,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65737 samples/s/p 0:53:20 } +2024-07-30 05:17:04,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 864/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.4495342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.66075 samples/s/p 0:53:15 } +2024-07-30 05:17:07,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 866/ 3125], loss: 0.387, per_step_time: 1415ms, lr: 1.4471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:07,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65092 samples/s/p 0:53:18 } +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 868/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 1.4446726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65988 samples/s/p 0:53:10 } +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 870/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 1.4422443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.66031 samples/s/p 0:53:07 } +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 872/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 1.4398178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66059 samples/s/p 0:53:04 } +2024-07-30 05:17:18,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 874/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4373928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:18,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66060 samples/s/p 0:53:01 } +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 876/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 1.434969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.66095 samples/s/p 0:52:58 } +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 878/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.4325475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.66004 samples/s/p 0:52:55 } +2024-07-30 05:17:26,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 880/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.430127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:26,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66160 samples/s/p 0:52:52 } +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 882/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4277089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65942 samples/s/p 0:52:50 } +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 884/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 1.4252928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65913 samples/s/p 0:52:47 } +2024-07-30 05:17:35,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 886/ 3125], loss: 0.484, per_step_time: 1413ms, lr: 1.4228782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:35,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65871 samples/s/p 0:52:45 } +2024-07-30 05:17:38,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 888/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.4204651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66123 samples/s/p 0:52:41 } +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 890/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4180529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66034 samples/s/p 0:52:38 } +2024-07-30 05:17:43,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 892/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 1.4156436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:43,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65625 samples/s/p 0:52:38 } +2024-07-30 05:17:46,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 894/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.413236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:46,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65715 samples/s/p 0:52:34 } +2024-07-30 05:17:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 896/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.41083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:49,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65969 samples/s/p 0:52:30 } +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 898/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 1.4084255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65992 samples/s/p 0:52:27 } +2024-07-30 05:17:55,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 900/ 3125], loss: 0.492, per_step_time: 1413ms, lr: 1.406022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:55,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65913 samples/s/p 0:52:25 } +2024-07-30 05:17:58,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 902/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 1.4036211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65583 samples/s/p 0:52:24 } +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 904/ 3125], loss: 0.187, per_step_time: 1418ms, lr: 1.401222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:00,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.63887 samples/s/p 0:52:30 } +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 906/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 1.3988235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65426 samples/s/p 0:52:19 } +2024-07-30 05:18:06,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 908/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.396428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:06,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65681 samples/s/p 0:52:15 } +2024-07-30 05:18:09,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 910/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 1.3940337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:09,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65703 samples/s/p 0:52:12 } +2024-07-30 05:18:12,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 912/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 1.3916415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:12,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65728 samples/s/p 0:52:09 } +2024-07-30 05:18:15,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 914/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.389251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:15,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65953 samples/s/p 0:52:05 } +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 916/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.3868621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65996 samples/s/p 0:52:02 } +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 918/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.3844749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65982 samples/s/p 0:51:59 } +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 920/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 1.3820886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66067 samples/s/p 0:51:56 } +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 922/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 1.379705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:26,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65890 samples/s/p 0:51:54 } +2024-07-30 05:18:29,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 924/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.3773221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:29,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66130 samples/s/p 0:51:50 } +2024-07-30 05:18:32,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 926/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.374942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:32,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66136 samples/s/p 0:51:47 } +2024-07-30 05:18:34,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 928/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.3725635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65996 samples/s/p 0:51:45 } +2024-07-30 05:18:37,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 930/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.3701865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:37,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65939 samples/s/p 0:51:42 } +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 932/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 1.3678115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65803 samples/s/p 0:51:40 } +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 934/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 1.3654375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65906 samples/s/p 0:51:37 } +2024-07-30 05:18:46,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 936/ 3125], loss: 0.172, per_step_time: 1414ms, lr: 1.3630661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:46,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65496 samples/s/p 0:51:36 } +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 938/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 1.3606963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65966 samples/s/p 0:51:31 } +2024-07-30 05:18:51,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 940/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.3583282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:51,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65817 samples/s/p 0:51:29 } +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 942/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.3559616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.66138 samples/s/p 0:51:24 } +2024-07-30 05:18:57,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 944/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.3535961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:57,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65841 samples/s/p 0:51:23 } +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 946/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 1.3512334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66030 samples/s/p 0:51:19 } +2024-07-30 05:19:03,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 948/ 3125], loss: 0.154, per_step_time: 1412ms, lr: 1.3488716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:03,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66189 samples/s/p 0:51:16 } +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 950/ 3125], loss: 0.323, per_step_time: 1417ms, lr: 1.3465121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.64269 samples/s/p 0:51:23 } +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 952/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.3441542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:08,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65889 samples/s/p 0:51:11 } +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 954/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 1.3417986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65991 samples/s/p 0:51:08 } +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 956/ 3125], loss: 0.491, per_step_time: 1413ms, lr: 1.3394442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.66055 samples/s/p 0:51:05 } +2024-07-30 05:19:17,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 958/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 1.3370919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:17,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65886 samples/s/p 0:51:03 } +2024-07-30 05:19:20,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 960/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 1.3347413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65770 samples/s/p 0:51:01 } +2024-07-30 05:19:23,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 962/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 1.3323923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:23,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65906 samples/s/p 0:50:57 } +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 964/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 1.3300445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65657 samples/s/p 0:50:56 } +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 966/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.3276988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65977 samples/s/p 0:50:51 } +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 968/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.3253546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65648 samples/s/p 0:50:50 } +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 970/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.3230127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:34,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.66115 samples/s/p 0:50:45 } +2024-07-30 05:19:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 972/ 3125], loss: 0.278, per_step_time: 1414ms, lr: 1.3206726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65765 samples/s/p 0:50:44 } +2024-07-30 05:19:40,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 974/ 3125], loss: 0.165, per_step_time: 1414ms, lr: 1.3183341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:40,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65763 samples/s/p 0:50:41 } +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 976/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 1.3159975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65583 samples/s/p 0:50:39 } +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 978/ 3125], loss: 0.212, per_step_time: 1415ms, lr: 1.3136619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:45,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65240 samples/s/p 0:50:38 } +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 980/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 1.3113287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.64601 samples/s/p 0:50:39 } +2024-07-30 05:19:51,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 982/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 1.3089972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:51,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65415 samples/s/p 0:50:32 } +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 984/ 3125], loss: 0.330, per_step_time: 1412ms, lr: 1.3066679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66226 samples/s/p 0:50:24 } +2024-07-30 05:19:57,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 986/ 3125], loss: 0.351, per_step_time: 1414ms, lr: 1.30434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65592 samples/s/p 0:50:25 } +2024-07-30 05:19:59,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 988/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.302014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66112 samples/s/p 0:50:19 } +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 990/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 1.2996887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:02,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66192 samples/s/p 0:50:16 } +2024-07-30 05:20:05,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 992/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.2973654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:05,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65904 samples/s/p 0:50:15 } +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 994/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 1.2950447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65855 samples/s/p 0:50:12 } +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 996/ 3125], loss: 0.069, per_step_time: 1413ms, lr: 1.2927258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66029 samples/s/p 0:50:09 } +2024-07-30 05:20:14,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 998/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 1.2904086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65982 samples/s/p 0:50:06 } +2024-07-30 05:20:16,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1000/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.288093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:16,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66159 samples/s/p 0:50:02 } +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1002/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.2857795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66040 samples/s/p 0:50:00 } +2024-07-30 05:20:22,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1004/ 3125], loss: 0.308, per_step_time: 1412ms, lr: 1.2834673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:22,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66205 samples/s/p 0:49:56 } +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1006/ 3125], loss: 0.276, per_step_time: 1415ms, lr: 1.2811565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65181 samples/s/p 0:49:59 } +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1008/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.2788483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65824 samples/s/p 0:49:53 } +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1010/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.2765416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66061 samples/s/p 0:49:49 } +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1012/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.2742358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65942 samples/s/p 0:49:46 } +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1014/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.271933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65618 samples/s/p 0:49:45 } +2024-07-30 05:20:39,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1016/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 1.2696316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65772 samples/s/p 0:49:42 } +2024-07-30 05:20:42,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1018/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 1.2673321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:42,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65764 samples/s/p 0:49:39 } +2024-07-30 05:20:45,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1020/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 1.2650338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:45,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65745 samples/s/p 0:49:36 } +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1022/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 1.2627381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65809 samples/s/p 0:49:33 } +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1024/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 1.2604439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65551 samples/s/p 0:49:31 } +2024-07-30 05:20:53,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1026/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.2581515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:53,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.66051 samples/s/p 0:49:26 } +2024-07-30 05:20:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1028/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.2558612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65120 samples/s/p 0:49:28 } +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1030/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2535721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66076 samples/s/p 0:49:20 } +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1032/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 1.2512851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65506 samples/s/p 0:49:20 } +2024-07-30 05:21:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1034/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.2489995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:05,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66044 samples/s/p 0:49:15 } +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1036/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.2467151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66040 samples/s/p 0:49:12 } +2024-07-30 05:21:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1038/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.2444335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:10,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66066 samples/s/p 0:49:09 } +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1040/ 3125], loss: 0.436, per_step_time: 1412ms, lr: 1.2421536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:13,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66177 samples/s/p 0:49:06 } +2024-07-30 05:21:16,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1042/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 1.2398758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:16,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65851 samples/s/p 0:49:04 } +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1044/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.2375996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66072 samples/s/p 0:49:00 } +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1046/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.2353253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66074 samples/s/p 0:48:58 } +2024-07-30 05:21:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1048/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2330526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65846 samples/s/p 0:48:56 } +2024-07-30 05:21:27,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1050/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.2307808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:27,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66138 samples/s/p 0:48:52 } +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1052/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 1.2285119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65907 samples/s/p 0:48:50 } +2024-07-30 05:21:33,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1054/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.2262445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:33,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65999 samples/s/p 0:48:47 } +2024-07-30 05:21:36,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1056/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.2239792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65952 samples/s/p 0:48:44 } +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1058/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 1.2217149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65922 samples/s/p 0:48:41 } +2024-07-30 05:21:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1060/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.2194532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.66009 samples/s/p 0:48:38 } +2024-07-30 05:21:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1062/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.2171932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65951 samples/s/p 0:48:36 } +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1064/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.214934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.66033 samples/s/p 0:48:32 } +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1066/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.2126776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.65953 samples/s/p 0:48:30 } +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1068/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.2104231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65877 samples/s/p 0:48:28 } +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1070/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.2081704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65940 samples/s/p 0:48:24 } +2024-07-30 05:21:59,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1072/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 1.2059196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:59,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65705 samples/s/p 0:48:23 } +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1074/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 1.2036704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:01,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65358 samples/s/p 0:48:22 } +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1076/ 3125], loss: 0.046, per_step_time: 1412ms, lr: 1.2014228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66230 samples/s/p 0:48:14 } +2024-07-30 05:22:07,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1078/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 1.1991766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:07,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65953 samples/s/p 0:48:13 } +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1080/ 3125], loss: 0.406, per_step_time: 1415ms, lr: 1.1969328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65289 samples/s/p 0:48:14 } +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1082/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 1.1946902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65677 samples/s/p 0:48:09 } +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1084/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.1924502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.66129 samples/s/p 0:48:04 } +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1086/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 1.1902121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66120 samples/s/p 0:48:01 } +2024-07-30 05:22:21,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1088/ 3125], loss: 0.171, per_step_time: 1415ms, lr: 1.1879754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:21,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65296 samples/s/p 0:48:02 } +2024-07-30 05:22:24,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1090/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 1.1857411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65727 samples/s/p 0:47:57 } +2024-07-30 05:22:27,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1092/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 1.1835074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:27,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65651 samples/s/p 0:47:55 } +2024-07-30 05:22:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1094/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1812764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66164 samples/s/p 0:47:49 } +2024-07-30 05:22:33,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 1.1790472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66130 samples/s/p 0:47:47 } +2024-07-30 05:22:35,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1098/ 3125], loss: 0.470, per_step_time: 1414ms, lr: 1.1768198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:35,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65462 samples/s/p 0:47:47 } +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1100/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 1.1745944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66166 samples/s/p 0:47:41 } +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1102/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 1.1723699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66066 samples/s/p 0:47:39 } +2024-07-30 05:22:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1104/ 3125], loss: 0.231, per_step_time: 1412ms, lr: 1.1701483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:44,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66271 samples/s/p 0:47:35 } +2024-07-30 05:22:47,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1106/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 1.167928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:47,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65919 samples/s/p 0:47:34 } +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1108/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.1657089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65930 samples/s/p 0:47:31 } +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1110/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 1.1634928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65843 samples/s/p 0:47:28 } +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1112/ 3125], loss: 0.417, per_step_time: 1415ms, lr: 1.1612782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65233 samples/s/p 0:47:29 } +2024-07-30 05:22:58,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1114/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 1.1590654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65374 samples/s/p 0:47:25 } +2024-07-30 05:23:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1116/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 1.1568549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65743 samples/s/p 0:47:20 } +2024-07-30 05:23:04,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1118/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.1546457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:04,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65929 samples/s/p 0:47:17 } +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1120/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1524385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.66028 samples/s/p 0:47:13 } +2024-07-30 05:23:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1122/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 1.1502325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.66040 samples/s/p 0:47:10 } +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1124/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1480287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66005 samples/s/p 0:47:08 } +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1126/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.1458262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66144 samples/s/p 0:47:04 } +2024-07-30 05:23:18,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1128/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.1436265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:18,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66043 samples/s/p 0:47:02 } +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1130/ 3125], loss: 0.113, per_step_time: 1412ms, lr: 1.1414284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66196 samples/s/p 0:46:58 } +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1132/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 1.1392325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.65981 samples/s/p 0:46:57 } +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1134/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.1370381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65899 samples/s/p 0:46:54 } +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1136/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.1348446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66214 samples/s/p 0:46:50 } +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1138/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 1.1326542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65720 samples/s/p 0:46:49 } +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1140/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.1304655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66161 samples/s/p 0:46:44 } +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1142/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 1.1282783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66147 samples/s/p 0:46:42 } +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1144/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 1.1260936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:41,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65659 samples/s/p 0:46:41 } +2024-07-30 05:23:43,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1239093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:43,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.66018 samples/s/p 0:46:37 } +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1148/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.1217281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65552 samples/s/p 0:46:36 } +2024-07-30 05:23:49,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1150/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 1.1195477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65828 samples/s/p 0:46:32 } +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1152/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.1173704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66098 samples/s/p 0:46:28 } +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1154/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 1.1151942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66135 samples/s/p 0:46:25 } +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1156/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 1.1130204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66085 samples/s/p 0:46:22 } +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1158/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 1.1108484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.65743 samples/s/p 0:46:21 } +2024-07-30 05:24:03,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1160/ 3125], loss: 0.223, per_step_time: 1416ms, lr: 1.1086782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:03,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.64658 samples/s/p 0:46:23 } +2024-07-30 05:24:06,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1162/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 1.1065096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:06,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65510 samples/s/p 0:46:16 } +2024-07-30 05:24:09,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1164/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.1043423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66127 samples/s/p 0:46:11 } +2024-07-30 05:24:12,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1166/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.1021775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:12,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65922 samples/s/p 0:46:09 } +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1168/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.1000147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65911 samples/s/p 0:46:06 } +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1170/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.0978531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66038 samples/s/p 0:46:03 } +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1172/ 3125], loss: 0.636, per_step_time: 1413ms, lr: 1.0956943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65856 samples/s/p 0:46:01 } +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1174/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.0935369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65830 samples/s/p 0:45:58 } +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1176/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 1.0913816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.66036 samples/s/p 0:45:54 } +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1178/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 1.0892278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65886 samples/s/p 0:45:52 } +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1180/ 3125], loss: 0.293, per_step_time: 1417ms, lr: 1.0870757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.64539 samples/s/p 0:45:56 } +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1182/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 1.0849258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65970 samples/s/p 0:45:46 } +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1184/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.082778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65937 samples/s/p 0:45:43 } +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1186/ 3125], loss: 0.209, per_step_time: 1415ms, lr: 1.0806319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65250 samples/s/p 0:45:44 } +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1188/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.0784879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65805 samples/s/p 0:45:38 } +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1190/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 1.0763446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66159 samples/s/p 0:45:34 } +2024-07-30 05:24:49,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1192/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 1.0742044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:49,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65996 samples/s/p 0:45:32 } +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1194/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.0720652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66078 samples/s/p 0:45:28 } +2024-07-30 05:24:54,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1196/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.0699284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:54,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65953 samples/s/p 0:45:26 } +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1198/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 1.0677936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65627 samples/s/p 0:45:25 } +2024-07-30 05:25:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1200/ 3125], loss: 0.418, per_step_time: 1414ms, lr: 1.0656607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65738 samples/s/p 0:45:22 } +2024-07-30 05:25:03,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1202/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.0635296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:03,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65384 samples/s/p 0:45:20 } +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1204/ 3125], loss: 0.090, per_step_time: 1416ms, lr: 1.0614004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64737 samples/s/p 0:45:21 } +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1206/ 3125], loss: 0.344, per_step_time: 1416ms, lr: 1.0592731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:08,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64632 samples/s/p 0:45:18 } +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1208/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.0571473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66070 samples/s/p 0:45:09 } +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1210/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 1.055024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:14,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66206 samples/s/p 0:45:05 } +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1212/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.0529023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66007 samples/s/p 0:45:03 } +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1214/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.0507816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66069 samples/s/p 0:45:00 } +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1216/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.0486639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65974 samples/s/p 0:44:58 } +2024-07-30 05:25:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1218/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 1.0465478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:25,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.65960 samples/s/p 0:44:55 } +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1220/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 1.0444339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66119 samples/s/p 0:44:52 } +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1222/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.0423207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:31,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.65806 samples/s/p 0:44:50 } +2024-07-30 05:25:34,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1224/ 3125], loss: 0.416, per_step_time: 1412ms, lr: 1.0402107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66175 samples/s/p 0:44:46 } +2024-07-30 05:25:37,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1226/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 1.0381021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:37,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66115 samples/s/p 0:44:43 } +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1228/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.0359954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66051 samples/s/p 0:44:41 } +2024-07-30 05:25:42,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1230/ 3125], loss: 0.169, per_step_time: 1412ms, lr: 1.0338911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66300 samples/s/p 0:44:37 } +2024-07-30 05:25:45,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1232/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 1.0317883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:45,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65978 samples/s/p 0:44:35 } +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1234/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 1.0296869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65752 samples/s/p 0:44:33 } +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1236/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 1.0275876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.65985 samples/s/p 0:44:30 } +2024-07-30 05:25:54,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1238/ 3125], loss: 0.423, per_step_time: 1416ms, lr: 1.0254902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:54,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.64856 samples/s/p 0:44:32 } +2024-07-30 05:25:57,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1240/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.023395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:57,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66092 samples/s/p 0:44:23 } +2024-07-30 05:25:59,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1242/ 3125], loss: 0.130, per_step_time: 1412ms, lr: 1.0213017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:59,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66175 samples/s/p 0:44:20 } +2024-07-30 05:26:02,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1244/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 1.0192105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.65944 samples/s/p 0:44:18 } +2024-07-30 05:26:05,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1246/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 1.0171208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:05,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65612 samples/s/p 0:44:17 } +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1248/ 3125], loss: 0.165, per_step_time: 1415ms, lr: 1.0150334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65307 samples/s/p 0:44:16 } +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1250/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.0129478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65991 samples/s/p 0:44:10 } +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1252/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.0108635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65709 samples/s/p 0:44:08 } +2024-07-30 05:26:16,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1254/ 3125], loss: 0.194, per_step_time: 1415ms, lr: 1.0087817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65062 samples/s/p 0:44:08 } +2024-07-30 05:26:19,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1256/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 1.0067016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:19,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65744 samples/s/p 0:44:02 } +2024-07-30 05:26:22,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1258/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 1.0046228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:22,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65678 samples/s/p 0:44:00 } +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1260/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.0025468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.66046 samples/s/p 0:43:55 } +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1262/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.0004726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:28,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65928 samples/s/p 0:43:53 } +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1264/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 9.984001e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65423 samples/s/p 0:43:53 } +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1266/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.963288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.65970 samples/s/p 0:43:47 } +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1268/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.942609e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66299 samples/s/p 0:43:43 } +2024-07-30 05:26:39,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1270/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 9.921941e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:39,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66020 samples/s/p 0:43:41 } +2024-07-30 05:26:42,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1272/ 3125], loss: 0.419, per_step_time: 1419ms, lr: 9.901294e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:42,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.63532 samples/s/p 0:43:50 } +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1274/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 9.880667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66007 samples/s/p 0:43:36 } +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1276/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 9.86006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66042 samples/s/p 0:43:33 } +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1278/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.839463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66042 samples/s/p 0:43:30 } +2024-07-30 05:26:53,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1280/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.818893e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66065 samples/s/p 0:43:27 } +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1282/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.798335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.65807 samples/s/p 0:43:25 } +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1284/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.777805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65998 samples/s/p 0:43:22 } +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1286/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.757292e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66058 samples/s/p 0:43:19 } +2024-07-30 05:27:05,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1288/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 9.7368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66044 samples/s/p 0:43:16 } +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1290/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.716326e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66054 samples/s/p 0:43:13 } +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1292/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.695873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66007 samples/s/p 0:43:10 } +2024-07-30 05:27:13,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1294/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.675427e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:13,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66023 samples/s/p 0:43:07 } +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1296/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.655014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66016 samples/s/p 0:43:05 } +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1298/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.634616e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66022 samples/s/p 0:43:02 } +2024-07-30 05:27:22,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1300/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 9.614238e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:22,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66314 samples/s/p 0:42:58 } +2024-07-30 05:27:25,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1302/ 3125], loss: 0.200, per_step_time: 1415ms, lr: 9.593874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:25,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65276 samples/s/p 0:42:59 } +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1304/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 9.573533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:27,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.66190 samples/s/p 0:42:52 } +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1306/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 9.553214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65755 samples/s/p 0:42:52 } +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1308/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.532913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65523 samples/s/p 0:42:50 } +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1310/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 9.512627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65786 samples/s/p 0:42:46 } +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1312/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.4923644e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66096 samples/s/p 0:42:42 } +2024-07-30 05:27:42,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1314/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.4721196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:42,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.65991 samples/s/p 0:42:39 } +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1316/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 9.4518987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66120 samples/s/p 0:42:36 } +2024-07-30 05:27:47,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1318/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 9.4316925e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:47,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66072 samples/s/p 0:42:33 } +2024-07-30 05:27:50,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1320/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 9.4115137e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:50,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66177 samples/s/p 0:42:30 } +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1322/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.391346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65883 samples/s/p 0:42:28 } +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1324/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.371191e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66111 samples/s/p 0:42:25 } +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1326/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.3510596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:59,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65861 samples/s/p 0:42:23 } +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1328/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 9.330952e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66008 samples/s/p 0:42:19 } +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1330/ 3125], loss: 0.522, per_step_time: 1414ms, lr: 9.310865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65669 samples/s/p 0:42:18 } +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1332/ 3125], loss: 0.282, per_step_time: 1415ms, lr: 9.2907993e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65361 samples/s/p 0:42:17 } +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1334/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.270751e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65937 samples/s/p 0:42:11 } +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1336/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.2507213e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65575 samples/s/p 0:42:10 } +2024-07-30 05:28:16,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1338/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 9.230703e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:16,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65727 samples/s/p 0:42:07 } +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1340/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.2107143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65883 samples/s/p 0:42:03 } +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1342/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 9.190744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65824 samples/s/p 0:42:00 } +2024-07-30 05:28:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1344/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.1707915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:24,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65993 samples/s/p 0:41:57 } +2024-07-30 05:28:27,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1346/ 3125], loss: 0.495, per_step_time: 1413ms, lr: 9.1508593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:27,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66113 samples/s/p 0:41:53 } +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1348/ 3125], loss: 0.077, per_step_time: 1413ms, lr: 9.1309425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66107 samples/s/p 0:41:51 } +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1350/ 3125], loss: 0.083, per_step_time: 1412ms, lr: 9.1110496e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66180 samples/s/p 0:41:48 } +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1352/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.0911686e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65927 samples/s/p 0:41:46 } +2024-07-30 05:28:38,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1354/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.071317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:38,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65943 samples/s/p 0:41:43 } +2024-07-30 05:28:41,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1356/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.0514806e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:41,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65950 samples/s/p 0:41:40 } +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1358/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.0316684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66004 samples/s/p 0:41:37 } +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1360/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.011873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66111 samples/s/p 0:41:34 } +2024-07-30 05:28:50,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1362/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.992097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:50,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65885 samples/s/p 0:41:32 } +2024-07-30 05:28:52,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1364/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 8.972341e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:52,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65927 samples/s/p 0:41:29 } +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1366/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.9526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65703 samples/s/p 0:41:27 } +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1368/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 8.9328825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65697 samples/s/p 0:41:24 } +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1370/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.913186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66163 samples/s/p 0:41:19 } +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1372/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 8.8935013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65961 samples/s/p 0:41:17 } +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1374/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 8.873841e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66059 samples/s/p 0:41:14 } +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1376/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 8.854207e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66361 samples/s/p 0:41:10 } +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1378/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.834588e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66141 samples/s/p 0:41:08 } +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1380/ 3125], loss: 0.412, per_step_time: 1412ms, lr: 8.8149875e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66215 samples/s/p 0:41:05 } +2024-07-30 05:29:18,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1382/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 8.795401e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:18,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66005 samples/s/p 0:41:03 } +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1384/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.7758417e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66054 samples/s/p 0:41:00 } +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1386/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 8.7563006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65812 samples/s/p 0:40:58 } +2024-07-30 05:29:26,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1388/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 8.736783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:26,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66283 samples/s/p 0:40:53 } +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1390/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 8.7172805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65966 samples/s/p 0:40:52 } +2024-07-30 05:29:32,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1392/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 8.697793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66074 samples/s/p 0:40:49 } +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1394/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.678335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65982 samples/s/p 0:40:46 } +2024-07-30 05:29:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1396/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.658886e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65667 samples/s/p 0:40:45 } +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1398/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 8.6394635e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:41,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65455 samples/s/p 0:40:43 } +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1400/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 8.620065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.66010 samples/s/p 0:40:38 } +2024-07-30 05:29:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1402/ 3125], loss: 0.256, per_step_time: 1415ms, lr: 8.6006816e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:46,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65264 samples/s/p 0:40:38 } +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1404/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.581319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.66130 samples/s/p 0:40:31 } +2024-07-30 05:29:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1406/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.5619746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:52,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65863 samples/s/p 0:40:30 } +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1408/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.5426535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66072 samples/s/p 0:40:26 } +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1410/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.523345e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:58,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65854 samples/s/p 0:40:24 } +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1412/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 8.5040597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66029 samples/s/p 0:40:21 } +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1414/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 8.4847983e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65546 samples/s/p 0:40:20 } +2024-07-30 05:30:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1416/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 8.4655494e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65903 samples/s/p 0:40:15 } +2024-07-30 05:30:09,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1418/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.446324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:09,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65996 samples/s/p 0:40:12 } +2024-07-30 05:30:12,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1420/ 3125], loss: 0.274, per_step_time: 1425ms, lr: 8.427119e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:12,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.61121 samples/s/p 0:40:30 } +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1422/ 3125], loss: 0.061, per_step_time: 1412ms, lr: 8.407938e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66191 samples/s/p 0:40:06 } +2024-07-30 05:30:17,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1424/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.3887664e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:17,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66015 samples/s/p 0:40:04 } +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1426/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 8.3696216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65435 samples/s/p 0:40:03 } +2024-07-30 05:30:23,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1428/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 8.3505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:23,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66091 samples/s/p 0:39:58 } +2024-07-30 05:30:26,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1430/ 3125], loss: 0.045, per_step_time: 1414ms, lr: 8.331391e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:26,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65743 samples/s/p 0:39:56 } +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1432/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 8.3123115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66028 samples/s/p 0:39:52 } +2024-07-30 05:30:32,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1434/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 8.293244e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:32,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.66016 samples/s/p 0:39:50 } +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1436/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.2741946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.65885 samples/s/p 0:39:47 } +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1438/ 3125], loss: 0.568, per_step_time: 1414ms, lr: 8.2551685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.65725 samples/s/p 0:39:45 } +2024-07-30 05:30:40,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1440/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.236155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:40,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66174 samples/s/p 0:39:40 } +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1442/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 8.217174e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66039 samples/s/p 0:39:38 } +2024-07-30 05:30:46,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1444/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.1982074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:46,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66025 samples/s/p 0:39:35 } +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1446/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.179262e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66119 samples/s/p 0:39:32 } +2024-07-30 05:30:51,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1448/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.160338e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.65973 samples/s/p 0:39:30 } +2024-07-30 05:30:54,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1450/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.141431e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:54,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66128 samples/s/p 0:39:26 } +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1452/ 3125], loss: 0.133, per_step_time: 1417ms, lr: 8.1225454e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.64563 samples/s/p 0:39:30 } +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1454/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.1036774e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65952 samples/s/p 0:39:22 } +2024-07-30 05:31:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1456/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 8.0848275e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66264 samples/s/p 0:39:17 } +2024-07-30 05:31:06,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1458/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.0660044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66154 samples/s/p 0:39:15 } +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1460/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.047193e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65937 samples/s/p 0:39:13 } +2024-07-30 05:31:11,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1462/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.028409e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:11,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65716 samples/s/p 0:39:11 } +2024-07-30 05:31:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1464/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.0096453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:14,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66151 samples/s/p 0:39:07 } +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1466/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.9908966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65816 samples/s/p 0:39:05 } +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1468/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 7.9721656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66097 samples/s/p 0:39:01 } +2024-07-30 05:31:23,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1470/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 7.9534647e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:23,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65868 samples/s/p 0:38:59 } +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1472/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.9347785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.66124 samples/s/p 0:38:55 } +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1474/ 3125], loss: 0.316, per_step_time: 1415ms, lr: 7.916108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65265 samples/s/p 0:38:56 } +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1476/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 7.8974665e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65796 samples/s/p 0:38:51 } +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1478/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 7.87884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65688 samples/s/p 0:38:49 } +2024-07-30 05:31:37,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1480/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.860231e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:37,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65821 samples/s/p 0:38:45 } +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1482/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.841646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65800 samples/s/p 0:38:43 } +2024-07-30 05:31:42,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1484/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 7.8230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:42,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65651 samples/s/p 0:38:40 } +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1486/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.804531e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65995 samples/s/p 0:38:36 } +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1488/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 7.7860085e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65343 samples/s/p 0:38:36 } +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1490/ 3125], loss: 0.481, per_step_time: 1412ms, lr: 7.767504e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:51,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66298 samples/s/p 0:38:29 } +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1492/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.7490176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66029 samples/s/p 0:38:28 } +2024-07-30 05:31:57,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1494/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 7.7305555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:57,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.65818 samples/s/p 0:38:26 } +2024-07-30 05:31:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1496/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 7.7121075e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66123 samples/s/p 0:38:21 } +2024-07-30 05:32:02,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1498/ 3125], loss: 0.152, per_step_time: 1412ms, lr: 7.693684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66193 samples/s/p 0:38:18 } +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1500/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 7.675281e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.64983 samples/s/p 0:38:20 } +2024-07-30 05:32:08,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1502/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.656899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66111 samples/s/p 0:38:13 } +2024-07-30 05:32:11,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1504/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 7.6385317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:11,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66164 samples/s/p 0:38:10 } +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1506/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 7.6201883e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65621 samples/s/p 0:38:09 } +2024-07-30 05:32:16,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1508/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.601866e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:16,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66105 samples/s/p 0:38:05 } +2024-07-30 05:32:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1510/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.583564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:19,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65904 samples/s/p 0:38:03 } +2024-07-30 05:32:22,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1512/ 3125], loss: 0.093, per_step_time: 1413ms, lr: 7.5652775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:22,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65909 samples/s/p 0:38:00 } +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1514/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.547015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:25,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66105 samples/s/p 0:37:56 } +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1516/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 7.5287755e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65989 samples/s/p 0:37:54 } +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1518/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.5105544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65999 samples/s/p 0:37:51 } +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1520/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.492354e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66265 samples/s/p 0:37:47 } +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1522/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 7.474175e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65816 samples/s/p 0:37:46 } +2024-07-30 05:32:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1524/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 7.4560074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65911 samples/s/p 0:37:43 } +2024-07-30 05:32:42,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1526/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 7.43787e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:42,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66103 samples/s/p 0:37:39 } +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1528/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 7.419744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65717 samples/s/p 0:37:38 } +2024-07-30 05:32:48,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1530/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.401645e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:48,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65994 samples/s/p 0:37:34 } +2024-07-30 05:32:50,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1532/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 7.383564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65931 samples/s/p 0:37:31 } +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1534/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.3655065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.66081 samples/s/p 0:37:28 } +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1536/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 7.3474706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66314 samples/s/p 0:37:24 } +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1538/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.3294547e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66093 samples/s/p 0:37:22 } +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1540/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.311451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65760 samples/s/p 0:37:21 } +2024-07-30 05:33:05,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1542/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 7.2934745e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:05,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65997 samples/s/p 0:37:17 } +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1544/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 7.2755154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66025 samples/s/p 0:37:14 } +2024-07-30 05:33:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1546/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.2575807e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65851 samples/s/p 0:37:12 } +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1548/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.23966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.66089 samples/s/p 0:37:08 } +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1550/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 7.221764e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65703 samples/s/p 0:37:07 } +2024-07-30 05:33:19,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1552/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.2038887e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:19,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65885 samples/s/p 0:37:03 } +2024-07-30 05:33:22,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1554/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 7.186028e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:22,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65747 samples/s/p 0:37:01 } +2024-07-30 05:33:24,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1556/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.168197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:24,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.66285 samples/s/p 0:36:56 } +2024-07-30 05:33:27,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1558/ 3125], loss: 0.151, per_step_time: 1425ms, lr: 7.1503814e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:27,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.61239 samples/s/p 0:37:13 } +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1560/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 7.1325894e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.66290 samples/s/p 0:36:50 } +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1562/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 7.1148185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65701 samples/s/p 0:36:50 } +2024-07-30 05:33:36,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1564/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.097065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:36,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65434 samples/s/p 0:36:48 } +2024-07-30 05:33:39,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1566/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.079333e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:39,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65742 samples/s/p 0:36:44 } +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1568/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.061618e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66050 samples/s/p 0:36:40 } +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1570/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.043928e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:44,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66032 samples/s/p 0:36:37 } +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1572/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.026252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65997 samples/s/p 0:36:35 } +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1574/ 3125], loss: 0.055, per_step_time: 1413ms, lr: 7.008603e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66145 samples/s/p 0:36:31 } +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1576/ 3125], loss: 0.414, per_step_time: 1412ms, lr: 6.990972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66190 samples/s/p 0:36:28 } +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1578/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.973365e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65942 samples/s/p 0:36:26 } +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1580/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.9557757e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65961 samples/s/p 0:36:23 } +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1582/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.93821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65930 samples/s/p 0:36:21 } +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1584/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 6.920656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66162 samples/s/p 0:36:17 } +2024-07-30 05:34:07,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1586/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9031324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:07,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66084 samples/s/p 0:36:14 } +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1588/ 3125], loss: 0.271, per_step_time: 1416ms, lr: 6.8856235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.64722 samples/s/p 0:36:17 } +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1590/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 6.868142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:13,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66109 samples/s/p 0:36:09 } +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1592/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 6.8506716e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66031 samples/s/p 0:36:06 } +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1594/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 6.833228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65511 samples/s/p 0:36:05 } +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1596/ 3125], loss: 0.382, per_step_time: 1412ms, lr: 6.8158056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:21,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66227 samples/s/p 0:36:00 } +2024-07-30 05:34:24,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1598/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.7983956e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:24,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65846 samples/s/p 0:35:58 } +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1600/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.7810146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66151 samples/s/p 0:35:54 } +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1602/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 6.763652e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65769 samples/s/p 0:35:53 } +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1604/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 6.74631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65721 samples/s/p 0:35:50 } +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1606/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.7289915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:35,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65915 samples/s/p 0:35:47 } +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1608/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 6.711691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65645 samples/s/p 0:35:45 } +2024-07-30 05:34:41,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1610/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.694412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:41,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.66170 samples/s/p 0:35:40 } +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1612/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 6.67715e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65173 samples/s/p 0:35:41 } +2024-07-30 05:34:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1614/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.659913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:47,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65979 samples/s/p 0:35:35 } +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1616/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.64269e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66169 samples/s/p 0:35:32 } +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1618/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.6254944e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65940 samples/s/p 0:35:30 } +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1620/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 6.608319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66227 samples/s/p 0:35:26 } +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1622/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 6.591165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:58,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.66150 samples/s/p 0:35:23 } +2024-07-30 05:35:01,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1624/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.574032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:01,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.65882 samples/s/p 0:35:21 } +2024-07-30 05:35:04,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1626/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.55691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:04,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.65750 samples/s/p 0:35:19 } +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1628/ 3125], loss: 0.344, per_step_time: 1415ms, lr: 6.5398183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:07,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.65358 samples/s/p 0:35:18 } +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1630/ 3125], loss: 0.373, per_step_time: 1417ms, lr: 6.5227505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.64371 samples/s/p 0:35:19 } +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1632/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 6.505698e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66024 samples/s/p 0:35:10 } +2024-07-30 05:35:15,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1634/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.488666e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:15,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65859 samples/s/p 0:35:07 } +2024-07-30 05:35:18,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1636/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.471661e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:18,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65939 samples/s/p 0:35:04 } +2024-07-30 05:35:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1638/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 6.4546646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:21,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66117 samples/s/p 0:35:01 } +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1640/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.4376917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65881 samples/s/p 0:34:59 } +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1642/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 6.420746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66078 samples/s/p 0:34:55 } +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1644/ 3125], loss: 0.177, per_step_time: 1415ms, lr: 6.4038187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:29,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65269 samples/s/p 0:34:55 } +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1646/ 3125], loss: 0.263, per_step_time: 1412ms, lr: 6.386912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66184 samples/s/p 0:34:49 } +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1648/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.3700315e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65996 samples/s/p 0:34:47 } +2024-07-30 05:35:38,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1650/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.3531667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.65969 samples/s/p 0:34:44 } +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1652/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 6.336322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66058 samples/s/p 0:34:41 } +2024-07-30 05:35:43,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1654/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 6.319502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:43,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66214 samples/s/p 0:34:38 } +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1656/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 6.3026965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66270 samples/s/p 0:34:35 } +2024-07-30 05:35:49,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1658/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 6.285912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:49,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65817 samples/s/p 0:34:34 } +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1660/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 6.269154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66244 samples/s/p 0:34:29 } +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1662/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.2524106e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66122 samples/s/p 0:34:27 } +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1664/ 3125], loss: 0.147, per_step_time: 1415ms, lr: 6.2356946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65166 samples/s/p 0:34:28 } +2024-07-30 05:36:00,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1666/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 6.2189963e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:00,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66177 samples/s/p 0:34:21 } +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1668/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.202322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65836 samples/s/p 0:34:19 } +2024-07-30 05:36:06,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1670/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 6.1856593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65637 samples/s/p 0:34:17 } +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1672/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 6.169027e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65816 samples/s/p 0:34:14 } +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1674/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.152415e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65731 samples/s/p 0:34:11 } +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1676/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 6.135824e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65736 samples/s/p 0:34:09 } +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1678/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 6.119251e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66069 samples/s/p 0:34:04 } +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1680/ 3125], loss: 0.404, per_step_time: 1412ms, lr: 6.1026986e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66220 samples/s/p 0:34:01 } +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1682/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.0861674e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.65824 samples/s/p 0:34:00 } +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1684/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.069654e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66002 samples/s/p 0:33:56 } +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1686/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.053165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:29,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66103 samples/s/p 0:33:53 } +2024-07-30 05:36:32,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1688/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.036699e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:32,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66143 samples/s/p 0:33:50 } +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1690/ 3125], loss: 0.472, per_step_time: 1412ms, lr: 6.0202535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66222 samples/s/p 0:33:47 } +2024-07-30 05:36:37,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1692/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 6.003827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66067 samples/s/p 0:33:45 } +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1694/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9874264e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66065 samples/s/p 0:33:42 } +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1696/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 5.971044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66244 samples/s/p 0:33:38 } +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1698/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 5.9546767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65971 samples/s/p 0:33:37 } +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1700/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 5.938336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65952 samples/s/p 0:33:34 } +2024-07-30 05:36:51,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1702/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 5.922016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:51,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65841 samples/s/p 0:33:31 } +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1704/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 5.9057203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65833 samples/s/p 0:33:29 } +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1706/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 5.8894364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65529 samples/s/p 0:33:27 } +2024-07-30 05:37:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1708/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 5.8731825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:00,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65961 samples/s/p 0:33:22 } +2024-07-30 05:37:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1710/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.856946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65944 samples/s/p 0:33:20 } +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1712/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.8407306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65864 samples/s/p 0:33:17 } +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1714/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.824533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65952 samples/s/p 0:33:14 } +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1716/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 5.8083623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65502 samples/s/p 0:33:13 } +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1718/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 5.792209e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:14,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65499 samples/s/p 0:33:10 } +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1720/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.7760803e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65792 samples/s/p 0:33:06 } +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1722/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 5.759972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65722 samples/s/p 0:33:04 } +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1724/ 3125], loss: 0.136, per_step_time: 1414ms, lr: 5.7438876e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65411 samples/s/p 0:33:02 } +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1726/ 3125], loss: 0.655, per_step_time: 1415ms, lr: 5.7278123e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65298 samples/s/p 0:32:59 } +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1728/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.71177e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:28,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66073 samples/s/p 0:32:54 } +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1730/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6957424e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66042 samples/s/p 0:32:51 } +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1732/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6797353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66061 samples/s/p 0:32:48 } +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1734/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.6637555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.65995 samples/s/p 0:32:46 } +2024-07-30 05:37:40,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1736/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 5.647793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:40,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66222 samples/s/p 0:32:42 } +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1738/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.631855e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66057 samples/s/p 0:32:40 } +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1740/ 3125], loss: 0.575, per_step_time: 1412ms, lr: 5.6159377e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66220 samples/s/p 0:32:36 } +2024-07-30 05:37:48,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1742/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.600035e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:48,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66016 samples/s/p 0:32:34 } +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1744/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.5841593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66171 samples/s/p 0:32:31 } +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1746/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 5.5683046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66305 samples/s/p 0:32:28 } +2024-07-30 05:37:57,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1748/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 5.5524737e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:57,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.65820 samples/s/p 0:32:26 } +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1750/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 5.536655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66062 samples/s/p 0:32:23 } +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1752/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 5.5208653e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66115 samples/s/p 0:32:20 } +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1754/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 5.505097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66214 samples/s/p 0:32:17 } +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1756/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.4893405e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65886 samples/s/p 0:32:15 } +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1758/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4736165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65953 samples/s/p 0:32:12 } +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1760/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.457908e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66130 samples/s/p 0:32:08 } +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1762/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 5.442223e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65767 samples/s/p 0:32:07 } +2024-07-30 05:38:19,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1764/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.4265615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:19,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65959 samples/s/p 0:32:03 } +2024-07-30 05:38:22,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1766/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 5.4109216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:22,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66131 samples/s/p 0:32:00 } +2024-07-30 05:38:25,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1768/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.395296e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66070 samples/s/p 0:31:57 } +2024-07-30 05:38:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1770/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 5.379692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66099 samples/s/p 0:31:54 } +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1772/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.364117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66055 samples/s/p 0:31:52 } +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1774/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 5.3485513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65768 samples/s/p 0:31:50 } +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1776/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.333021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66113 samples/s/p 0:31:46 } +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1778/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 5.317503e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:39,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65934 samples/s/p 0:31:44 } +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1780/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.302012e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65827 samples/s/p 0:31:41 } +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1782/ 3125], loss: 0.191, per_step_time: 1415ms, lr: 5.2865414e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65326 samples/s/p 0:31:40 } +2024-07-30 05:38:48,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1784/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 5.271089e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66066 samples/s/p 0:31:35 } +2024-07-30 05:38:50,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1786/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.2556544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:50,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66100 samples/s/p 0:31:32 } +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1788/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 5.240249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65456 samples/s/p 0:31:31 } +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1790/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 5.2248623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66084 samples/s/p 0:31:26 } +2024-07-30 05:38:59,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1792/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 5.2094964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:59,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66057 samples/s/p 0:31:23 } +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1794/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 5.194148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65846 samples/s/p 0:31:21 } +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1796/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 5.178827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65764 samples/s/p 0:31:19 } +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1798/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.1635266e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66078 samples/s/p 0:31:15 } +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1800/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 5.1482436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65801 samples/s/p 0:31:13 } +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1802/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 5.132985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65723 samples/s/p 0:31:10 } +2024-07-30 05:39:16,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1804/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 5.11775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:16,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.66043 samples/s/p 0:31:06 } +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1806/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.102533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65458 samples/s/p 0:31:06 } +2024-07-30 05:39:22,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1808/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.08734e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:22,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65815 samples/s/p 0:31:02 } +2024-07-30 05:39:24,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1810/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.072167e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:24,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65945 samples/s/p 0:30:58 } +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1812/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.057019e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65984 samples/s/p 0:30:55 } +2024-07-30 05:39:30,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1814/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 5.0418885e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:30,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65499 samples/s/p 0:30:54 } +2024-07-30 05:39:33,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1816/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 5.0267784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65671 samples/s/p 0:30:51 } +2024-07-30 05:39:36,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1818/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 5.0116836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65531 samples/s/p 0:30:48 } +2024-07-30 05:39:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1820/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 4.996621e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:39,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65224 samples/s/p 0:30:47 } +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1822/ 3125], loss: 0.149, per_step_time: 1414ms, lr: 4.981577e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65380 samples/s/p 0:30:43 } +2024-07-30 05:39:44,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1824/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.966557e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:44,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65592 samples/s/p 0:30:40 } +2024-07-30 05:39:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1826/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 4.9515575e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:47,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65575 samples/s/p 0:30:37 } +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1828/ 3125], loss: 0.129, per_step_time: 1415ms, lr: 4.936573e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65017 samples/s/p 0:30:36 } +2024-07-30 05:39:53,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1830/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 4.921615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:53,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65416 samples/s/p 0:30:32 } +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1832/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 4.906681e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65388 samples/s/p 0:30:29 } +2024-07-30 05:39:58,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1834/ 3125], loss: 0.434, per_step_time: 1414ms, lr: 4.891765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:58,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65513 samples/s/p 0:30:26 } +2024-07-30 05:40:01,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1836/ 3125], loss: 0.215, per_step_time: 1415ms, lr: 4.8768726e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:01,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65291 samples/s/p 0:30:24 } +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1838/ 3125], loss: 0.347, per_step_time: 1416ms, lr: 4.8619955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.64946 samples/s/p 0:30:22 } +2024-07-30 05:40:07,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1840/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 4.847148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:07,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65423 samples/s/p 0:30:18 } +2024-07-30 05:40:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1842/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 4.8323153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65713 samples/s/p 0:30:14 } +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1844/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 4.8175065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65622 samples/s/p 0:30:11 } +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1846/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 4.802728e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.65935 samples/s/p 0:30:07 } +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1848/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.7879604e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66189 samples/s/p 0:30:04 } +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1850/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7732203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66002 samples/s/p 0:30:02 } +2024-07-30 05:40:24,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1852/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 4.758501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:24,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.65950 samples/s/p 0:29:59 } +2024-07-30 05:40:27,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1854/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 4.7438024e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:27,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66124 samples/s/p 0:29:56 } +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1856/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.7291277e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.66107 samples/s/p 0:29:53 } +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1858/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 4.714465e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65831 samples/s/p 0:29:51 } +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1860/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 4.699832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65885 samples/s/p 0:29:48 } +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1862/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 4.685214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65781 samples/s/p 0:29:45 } +2024-07-30 05:40:41,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1864/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.670626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:41,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65884 samples/s/p 0:29:42 } +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1866/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 4.6560555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65673 samples/s/p 0:29:40 } +2024-07-30 05:40:47,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1868/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.641509e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:47,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65802 samples/s/p 0:29:37 } +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1870/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.6269832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65778 samples/s/p 0:29:34 } +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1872/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 4.6124725e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.66116 samples/s/p 0:29:30 } +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1874/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 4.5979917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66102 samples/s/p 0:29:27 } +2024-07-30 05:40:58,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1876/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.5835316e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:58,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66091 samples/s/p 0:29:25 } +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1878/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 4.5690953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66069 samples/s/p 0:29:22 } +2024-07-30 05:41:04,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1880/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 4.554677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:04,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65902 samples/s/p 0:29:20 } +2024-07-30 05:41:07,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1882/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.5402763e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:07,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65939 samples/s/p 0:29:17 } +2024-07-30 05:41:09,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1884/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 4.5259057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:09,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65553 samples/s/p 0:29:15 } +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1886/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 4.51155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65382 samples/s/p 0:29:13 } +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1888/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.497218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65612 samples/s/p 0:29:09 } +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1890/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 4.482907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.66118 samples/s/p 0:29:05 } +2024-07-30 05:41:21,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1892/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 4.4686226e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:21,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65978 samples/s/p 0:29:02 } +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1894/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 4.4543594e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65831 samples/s/p 0:29:00 } +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1896/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 4.440114e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65849 samples/s/p 0:28:57 } +2024-07-30 05:41:29,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1898/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.4258923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:29,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65946 samples/s/p 0:28:54 } +2024-07-30 05:41:32,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1900/ 3125], loss: 0.282, per_step_time: 1425ms, lr: 4.4116854e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:32,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.61381 samples/s/p 0:29:05 } +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1902/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 4.3975083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66054 samples/s/p 0:28:48 } +2024-07-30 05:41:38,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1904/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 4.3833552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:38,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66007 samples/s/p 0:28:45 } +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1906/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.369217e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66119 samples/s/p 0:28:42 } +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1908/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.3550997e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66017 samples/s/p 0:28:40 } +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1910/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 4.3410122e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66179 samples/s/p 0:28:36 } +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1912/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.3269455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.65943 samples/s/p 0:28:34 } +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1914/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.3128907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66133 samples/s/p 0:28:31 } +2024-07-30 05:41:55,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1916/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 4.2988657e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66028 samples/s/p 0:28:28 } +2024-07-30 05:41:58,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1918/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 4.2848615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:58,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66165 samples/s/p 0:28:25 } +2024-07-30 05:42:00,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1920/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 4.2708783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:00,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66150 samples/s/p 0:28:22 } +2024-07-30 05:42:03,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1922/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 4.2569218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66074 samples/s/p 0:28:20 } +2024-07-30 05:42:06,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1924/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 4.2429835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65954 samples/s/p 0:28:17 } +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1926/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.2290628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:09,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65800 samples/s/p 0:28:15 } +2024-07-30 05:42:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1928/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 4.215169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:12,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66112 samples/s/p 0:28:11 } +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1930/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 4.20129e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66227 samples/s/p 0:28:08 } +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1932/ 3125], loss: 0.346, per_step_time: 1412ms, lr: 4.1874407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66292 samples/s/p 0:28:05 } +2024-07-30 05:42:20,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1934/ 3125], loss: 0.110, per_step_time: 1414ms, lr: 4.1736124e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:20,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65617 samples/s/p 0:28:04 } +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1936/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 4.159802e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65824 samples/s/p 0:28:01 } +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1938/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 4.1460186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65799 samples/s/p 0:27:58 } +2024-07-30 05:42:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1940/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 4.132256e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66168 samples/s/p 0:27:54 } +2024-07-30 05:42:32,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1942/ 3125], loss: 0.137, per_step_time: 1416ms, lr: 4.118514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:32,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.64866 samples/s/p 0:27:55 } +2024-07-30 05:42:34,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1944/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 4.10479e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:34,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65879 samples/s/p 0:27:49 } +2024-07-30 05:42:37,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1946/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.091096e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:37,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65951 samples/s/p 0:27:46 } +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1948/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.0774196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66105 samples/s/p 0:27:43 } +2024-07-30 05:42:43,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1950/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 4.063761e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65849 samples/s/p 0:27:41 } +2024-07-30 05:42:46,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1952/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.0501297e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:46,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65961 samples/s/p 0:27:38 } +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1954/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 4.0365188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66048 samples/s/p 0:27:34 } +2024-07-30 05:42:51,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1956/ 3125], loss: 0.320, per_step_time: 1412ms, lr: 4.0229318e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:51,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66224 samples/s/p 0:27:31 } +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1958/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 4.00936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66245 samples/s/p 0:27:28 } +2024-07-30 05:42:57,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1960/ 3125], loss: 0.147, per_step_time: 1418ms, lr: 3.995821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:57,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.63859 samples/s/p 0:27:32 } +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1962/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.9822964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.65958 samples/s/p 0:27:23 } +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1964/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 3.968799e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66359 samples/s/p 0:27:19 } +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1966/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.9553166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66049 samples/s/p 0:27:18 } +2024-07-30 05:43:08,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1968/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 3.9418606e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.66049 samples/s/p 0:27:15 } +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1970/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.9284288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65817 samples/s/p 0:27:13 } +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1972/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 3.9150117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65931 samples/s/p 0:27:09 } +2024-07-30 05:43:17,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1974/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.9016186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:17,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65297 samples/s/p 0:27:08 } +2024-07-30 05:43:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1976/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 3.888252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65943 samples/s/p 0:27:04 } +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1978/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 3.874904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:23,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65956 samples/s/p 0:27:01 } +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1980/ 3125], loss: 0.322, per_step_time: 1412ms, lr: 3.8615792e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66213 samples/s/p 0:26:57 } +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1982/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 3.8482784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65696 samples/s/p 0:26:56 } +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1984/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 3.8349955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66003 samples/s/p 0:26:52 } +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1986/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 3.8217425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.64841 samples/s/p 0:26:53 } +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1988/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.8085014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66105 samples/s/p 0:26:46 } +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1990/ 3125], loss: 0.203, per_step_time: 1415ms, lr: 3.795287e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65340 samples/s/p 0:26:46 } +2024-07-30 05:43:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1992/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 3.7820934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:42,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66245 samples/s/p 0:26:40 } +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1994/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7689267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65880 samples/s/p 0:26:38 } +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1996/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 3.755772e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65717 samples/s/p 0:26:36 } +2024-07-30 05:43:51,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1998/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 3.7426472e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:51,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65773 samples/s/p 0:26:33 } +2024-07-30 05:43:54,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2000/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.729546e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:54,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65718 samples/s/p 0:26:30 } +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2002/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7164597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65645 samples/s/p 0:26:28 } +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2004/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7034005e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.66138 samples/s/p 0:26:24 } +2024-07-30 05:44:02,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2006/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.690362e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:02,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65885 samples/s/p 0:26:21 } +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2008/ 3125], loss: 0.410, per_step_time: 1412ms, lr: 3.677347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66253 samples/s/p 0:26:18 } +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2010/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 3.6643564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66092 samples/s/p 0:26:15 } +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2012/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.6513865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65777 samples/s/p 0:26:13 } +2024-07-30 05:44:14,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2014/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.6384372e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:14,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66114 samples/s/p 0:26:10 } +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2016/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 3.625506e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66305 samples/s/p 0:26:06 } +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2018/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.6126016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.65901 samples/s/p 0:26:04 } +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2020/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 3.599718e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66137 samples/s/p 0:26:01 } +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2022/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 3.5868555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:25,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66015 samples/s/p 0:25:58 } +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2024/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 3.5740166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66169 samples/s/p 0:25:55 } +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2026/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.5612015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65988 samples/s/p 0:25:53 } +2024-07-30 05:44:33,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2028/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.5484044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:33,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66030 samples/s/p 0:25:50 } +2024-07-30 05:44:36,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2030/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.535631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65775 samples/s/p 0:25:48 } +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2032/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 3.5228848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:39,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66008 samples/s/p 0:25:44 } +2024-07-30 05:44:42,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2034/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.5101561e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:42,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66112 samples/s/p 0:25:41 } +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2036/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.4974514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66022 samples/s/p 0:25:39 } +2024-07-30 05:44:48,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2038/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.4847704e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:48,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65870 samples/s/p 0:25:36 } +2024-07-30 05:44:50,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2040/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.4721046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:50,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65962 samples/s/p 0:25:33 } +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2042/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 3.4594655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65658 samples/s/p 0:25:31 } +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2044/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 3.446847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65754 samples/s/p 0:25:28 } +2024-07-30 05:44:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2046/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 3.4342526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65707 samples/s/p 0:25:25 } +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2048/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 3.421682e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.66222 samples/s/p 0:25:21 } +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2050/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 3.4091323e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:05,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65984 samples/s/p 0:25:19 } +2024-07-30 05:45:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2052/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.3966063e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:07,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65957 samples/s/p 0:25:16 } +2024-07-30 05:45:10,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2054/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 3.3841013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65931 samples/s/p 0:25:13 } +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2056/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.3716202e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.66086 samples/s/p 0:25:10 } +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2058/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 3.3591598e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65740 samples/s/p 0:25:08 } +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2060/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 3.3467143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65954 samples/s/p 0:25:05 } +2024-07-30 05:45:22,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2062/ 3125], loss: 0.276, per_step_time: 1418ms, lr: 3.3342985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:22,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64056 samples/s/p 0:25:07 } +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2064/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 3.321907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66168 samples/s/p 0:24:59 } +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2066/ 3125], loss: 0.146, per_step_time: 1412ms, lr: 3.30953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66181 samples/s/p 0:24:56 } +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2068/ 3125], loss: 0.238, per_step_time: 1417ms, lr: 3.297183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64306 samples/s/p 0:24:58 } +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2070/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 3.2848595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66034 samples/s/p 0:24:51 } +2024-07-30 05:45:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 3.272554e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:36,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65817 samples/s/p 0:24:48 } +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2074/ 3125], loss: 0.392, per_step_time: 1415ms, lr: 3.2602668e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65023 samples/s/p 0:24:48 } +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2076/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 3.248009e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65745 samples/s/p 0:24:43 } +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2078/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.2357693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65733 samples/s/p 0:24:40 } +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2080/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 3.2235562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65986 samples/s/p 0:24:37 } +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2082/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.211364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66098 samples/s/p 0:24:33 } +2024-07-30 05:45:53,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2084/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 3.19919e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:53,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65989 samples/s/p 0:24:31 } +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2086/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.1870425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66057 samples/s/p 0:24:28 } +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2088/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 3.17491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66125 samples/s/p 0:24:25 } +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2090/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 3.1628102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:01,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66104 samples/s/p 0:24:22 } +2024-07-30 05:46:04,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2092/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1507284e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:04,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66092 samples/s/p 0:24:19 } +2024-07-30 05:46:07,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2094/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 3.1386702e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65668 samples/s/p 0:24:18 } +2024-07-30 05:46:10,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.126633e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:10,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66131 samples/s/p 0:24:14 } +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2098/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1146197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66099 samples/s/p 0:24:11 } +2024-07-30 05:46:15,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2100/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 3.1026272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:15,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65641 samples/s/p 0:24:09 } +2024-07-30 05:46:18,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2102/ 3125], loss: 0.392, per_step_time: 1414ms, lr: 3.0906529e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:18,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65707 samples/s/p 0:24:06 } +2024-07-30 05:46:21,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2104/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.078708e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:21,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.66032 samples/s/p 0:24:03 } +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2106/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.066784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.66059 samples/s/p 0:24:00 } +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2108/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 3.0548782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65895 samples/s/p 0:23:57 } +2024-07-30 05:46:30,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2110/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.0429987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:30,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65952 samples/s/p 0:23:54 } +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2112/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.0311435e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65956 samples/s/p 0:23:51 } +2024-07-30 05:46:35,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2114/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.019309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:35,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66049 samples/s/p 0:23:48 } +2024-07-30 05:46:38,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2116/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 3.0074892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:38,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66144 samples/s/p 0:23:45 } +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2118/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.9957056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65848 samples/s/p 0:23:43 } +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2120/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 2.9839336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65741 samples/s/p 0:23:41 } +2024-07-30 05:46:47,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2122/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.9721915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:47,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65881 samples/s/p 0:23:37 } +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2124/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 2.9604672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66261 samples/s/p 0:23:34 } +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2126/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.94877e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66081 samples/s/p 0:23:31 } +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2128/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 2.9370904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65963 samples/s/p 0:23:29 } +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2130/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 2.9254346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66177 samples/s/p 0:23:25 } +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2132/ 3125], loss: 0.417, per_step_time: 1414ms, lr: 2.9138e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65691 samples/s/p 0:23:24 } +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2134/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 2.9021888e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65902 samples/s/p 0:23:20 } +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2136/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.8905987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65827 samples/s/p 0:23:18 } +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2138/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 2.8790353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65935 samples/s/p 0:23:15 } +2024-07-30 05:47:12,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2140/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 2.8674899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65810 samples/s/p 0:23:12 } +2024-07-30 05:47:15,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2142/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 2.8559742e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:15,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65732 samples/s/p 0:23:10 } +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2144/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.8444765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65789 samples/s/p 0:23:07 } +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 2.8329998e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65935 samples/s/p 0:23:03 } +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2148/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 2.8215436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65768 samples/s/p 0:23:01 } +2024-07-30 05:47:26,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2150/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.8101147e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65981 samples/s/p 0:22:58 } +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:48:03,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2152/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 2.7987033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66043 samples/s/p 0:22:55 } +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2154/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.7873187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:06,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66062 samples/s/p 0:22:52 } +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2156/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 2.7759552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.66101 samples/s/p 0:22:49 } +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2158/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 2.7646155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:11,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65822 samples/s/p 0:22:47 } +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2160/ 3125], loss: 0.600, per_step_time: 1413ms, lr: 2.7532965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.66021 samples/s/p 0:22:43 } +2024-07-30 05:48:17,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2162/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.7420015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:17,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65929 samples/s/p 0:22:41 } +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2164/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 2.7307271e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65663 samples/s/p 0:22:39 } +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2166/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.7194767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65998 samples/s/p 0:22:35 } +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2168/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 2.7082532e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65530 samples/s/p 0:22:33 } +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2170/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6970474e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65658 samples/s/p 0:22:30 } +2024-07-30 05:48:31,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2172/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 2.6858626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:31,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65674 samples/s/p 0:22:27 } +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2174/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 2.6747017e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66059 samples/s/p 0:22:24 } +2024-07-30 05:48:37,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2176/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.6635615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:37,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66072 samples/s/p 0:22:21 } +2024-07-30 05:48:40,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2178/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.6524512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:40,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65892 samples/s/p 0:22:18 } +2024-07-30 05:48:42,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2180/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.641356e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:42,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65957 samples/s/p 0:22:15 } +2024-07-30 05:48:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2182/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.6302874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65905 samples/s/p 0:22:13 } +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2184/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 2.6192455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65868 samples/s/p 0:22:10 } +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2186/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 2.6082188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65973 samples/s/p 0:22:07 } +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2188/ 3125], loss: 0.160, per_step_time: 1415ms, lr: 2.5972128e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65283 samples/s/p 0:22:06 } +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2190/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 2.5862366e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65927 samples/s/p 0:22:01 } +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2192/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 2.5752811e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.66135 samples/s/p 0:21:58 } +2024-07-30 05:49:02,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2194/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 2.5643467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:02,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66023 samples/s/p 0:21:55 } +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2196/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 2.553433e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66223 samples/s/p 0:21:52 } +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2198/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 2.5425493e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65532 samples/s/p 0:21:51 } +2024-07-30 05:49:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2200/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 2.5316834e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65855 samples/s/p 0:21:47 } +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2202/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.5208382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65866 samples/s/p 0:21:44 } +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2204/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 2.5100172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65856 samples/s/p 0:21:42 } +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.4992198e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66130 samples/s/p 0:21:38 } +2024-07-30 05:49:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2208/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 2.4884463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:22,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66097 samples/s/p 0:21:35 } +2024-07-30 05:49:25,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2210/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.4776935e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:25,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65950 samples/s/p 0:21:33 } +2024-07-30 05:49:28,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2212/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.4669646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:28,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65959 samples/s/p 0:21:30 } +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2214/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4562596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65846 samples/s/p 0:21:27 } +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2216/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 2.4455724e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65697 samples/s/p 0:21:25 } +2024-07-30 05:49:36,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2218/ 3125], loss: 0.370, per_step_time: 1415ms, lr: 2.4349092e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:36,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65276 samples/s/p 0:21:23 } +2024-07-30 05:49:39,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2220/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 2.424267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:39,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.66196 samples/s/p 0:21:18 } +2024-07-30 05:49:42,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2222/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.4136511e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:42,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65499 samples/s/p 0:21:17 } +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2224/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 2.4030626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65988 samples/s/p 0:21:13 } +2024-07-30 05:49:48,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2226/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3924918e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66052 samples/s/p 0:21:10 } +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2228/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 2.3819446e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66014 samples/s/p 0:21:07 } +2024-07-30 05:49:53,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2230/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.3714185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:53,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66249 samples/s/p 0:21:04 } +2024-07-30 05:49:56,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2232/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 2.3609131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:56,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66117 samples/s/p 0:21:01 } +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2234/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 2.3504346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66222 samples/s/p 0:20:58 } +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2236/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 2.339977e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66298 samples/s/p 0:20:55 } +2024-07-30 05:50:05,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2238/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 2.3295432e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.65713 samples/s/p 0:20:54 } +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2240/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 2.3191302e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66084 samples/s/p 0:20:50 } +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2242/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.3087412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:10,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65856 samples/s/p 0:20:48 } +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2244/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.298379e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66139 samples/s/p 0:20:44 } +2024-07-30 05:50:16,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2246/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 2.2880344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:16,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65911 samples/s/p 0:20:42 } +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2248/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.277714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66063 samples/s/p 0:20:39 } +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2250/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.2674172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65952 samples/s/p 0:20:36 } +2024-07-30 05:50:24,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2252/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.2571385e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:24,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65807 samples/s/p 0:20:34 } +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2254/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.2468895e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65694 samples/s/p 0:20:31 } +2024-07-30 05:50:30,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2256/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 2.2366582e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:30,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.66203 samples/s/p 0:20:27 } +2024-07-30 05:50:33,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2258/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.226451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:33,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65579 samples/s/p 0:20:26 } +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2260/ 3125], loss: 0.350, per_step_time: 1414ms, lr: 2.2162705e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65749 samples/s/p 0:20:23 } +2024-07-30 05:50:39,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2262/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 2.2061108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:39,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65808 samples/s/p 0:20:20 } +2024-07-30 05:50:41,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2264/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.1959691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:41,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66088 samples/s/p 0:20:16 } +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2266/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.1858513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66093 samples/s/p 0:20:13 } +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2268/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 2.1757631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.66033 samples/s/p 0:20:11 } +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2270/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 2.165693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65983 samples/s/p 0:20:08 } +2024-07-30 05:50:53,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2272/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 2.1556467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:53,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65611 samples/s/p 0:20:06 } +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2274/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.145627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65874 samples/s/p 0:20:03 } +2024-07-30 05:50:58,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2276/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.1356195e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65809 samples/s/p 0:20:00 } +2024-07-30 05:51:01,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2278/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 2.1256416e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:01,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65730 samples/s/p 0:19:57 } +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2280/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 2.1156906e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65606 samples/s/p 0:19:55 } +2024-07-30 05:51:07,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2282/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.1057605e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:07,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65265 samples/s/p 0:19:53 } +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2284/ 3125], loss: 0.233, per_step_time: 1415ms, lr: 2.0958453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65334 samples/s/p 0:19:50 } +2024-07-30 05:51:13,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2286/ 3125], loss: 0.250, per_step_time: 1414ms, lr: 2.0859599e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:13,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65441 samples/s/p 0:19:47 } +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2288/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.0760953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65870 samples/s/p 0:19:43 } +2024-07-30 05:51:18,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2290/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.0662516e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:18,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65855 samples/s/p 0:19:40 } +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2292/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 2.0564347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65825 samples/s/p 0:19:37 } +2024-07-30 05:51:24,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2294/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 2.0466386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:24,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.66211 samples/s/p 0:19:34 } +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2296/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.0368695e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.64974 samples/s/p 0:19:33 } +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2298/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 2.0271182e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66177 samples/s/p 0:19:28 } +2024-07-30 05:51:32,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2300/ 3125], loss: 0.330, per_step_time: 1412ms, lr: 2.0173967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:32,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66291 samples/s/p 0:19:25 } +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2302/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.007693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.65873 samples/s/p 0:19:23 } +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2304/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 1.9980102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66149 samples/s/p 0:19:20 } +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2306/ 3125], loss: 0.122, per_step_time: 1412ms, lr: 1.9883512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66299 samples/s/p 0:19:16 } +2024-07-30 05:51:44,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2308/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 1.9787161e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66215 samples/s/p 0:19:14 } +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2310/ 3125], loss: 0.457, per_step_time: 1412ms, lr: 1.969102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66206 samples/s/p 0:19:11 } +2024-07-30 05:51:49,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2312/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 1.9595146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66053 samples/s/p 0:19:09 } +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2314/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.949951e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66086 samples/s/p 0:19:06 } +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2316/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.9404054e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.66158 samples/s/p 0:19:03 } +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2318/ 3125], loss: 0.256, per_step_time: 1414ms, lr: 1.9308835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:58,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65641 samples/s/p 0:19:01 } +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2320/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9213884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:01,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65824 samples/s/p 0:18:58 } +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2322/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.9119173e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65572 samples/s/p 0:18:55 } +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2324/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.902464e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66008 samples/s/p 0:18:52 } +2024-07-30 05:52:09,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2326/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.8930375e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:09,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66017 samples/s/p 0:18:49 } +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2328/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 1.8836319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65990 samples/s/p 0:18:46 } +2024-07-30 05:52:15,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2330/ 3125], loss: 0.352, per_step_time: 1412ms, lr: 1.8742502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:15,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66278 samples/s/p 0:18:43 } +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2332/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.8648892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65890 samples/s/p 0:18:41 } +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2334/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.8555491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65855 samples/s/p 0:18:38 } +2024-07-30 05:52:23,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2336/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.8462389e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:23,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65836 samples/s/p 0:18:35 } +2024-07-30 05:52:26,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2338/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 1.8369495e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:26,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65846 samples/s/p 0:18:32 } +2024-07-30 05:52:29,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2340/ 3125], loss: 0.076, per_step_time: 1412ms, lr: 1.827684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:29,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.66200 samples/s/p 0:18:29 } +2024-07-30 05:52:32,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2342/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 1.8184393e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:32,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65225 samples/s/p 0:18:28 } +2024-07-30 05:52:35,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2344/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.8092155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.66031 samples/s/p 0:18:23 } +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2346/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 1.8000215e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65875 samples/s/p 0:18:21 } +2024-07-30 05:52:40,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2348/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 1.7908394e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:40,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65617 samples/s/p 0:18:18 } +2024-07-30 05:52:43,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2350/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 1.78169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:43,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65746 samples/s/p 0:18:15 } +2024-07-30 05:52:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2352/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.7725617e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65960 samples/s/p 0:18:12 } +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2354/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 1.7634571e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.66021 samples/s/p 0:18:09 } +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2356/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.7543672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65949 samples/s/p 0:18:07 } +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2358/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 1.7453104e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65671 samples/s/p 0:18:04 } +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2360/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.7362743e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65804 samples/s/p 0:18:01 } +2024-07-30 05:53:00,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2362/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 1.7272562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:00,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65611 samples/s/p 0:17:59 } +2024-07-30 05:53:03,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2364/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 1.7182677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65959 samples/s/p 0:17:55 } +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2366/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.7093032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65970 samples/s/p 0:17:52 } +2024-07-30 05:53:09,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2368/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7003566e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:09,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65973 samples/s/p 0:17:50 } +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2370/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 1.6914368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:12,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66172 samples/s/p 0:17:46 } +2024-07-30 05:53:14,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2372/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6825408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:14,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.66158 samples/s/p 0:17:44 } +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2374/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.6736627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.65940 samples/s/p 0:17:41 } +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2376/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.6648083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.66194 samples/s/p 0:17:38 } +2024-07-30 05:53:23,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2378/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.655975e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:23,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.65980 samples/s/p 0:17:35 } +2024-07-30 05:53:26,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2380/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 1.6471714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66128 samples/s/p 0:17:32 } +2024-07-30 05:53:29,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2382/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.6383856e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:29,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66023 samples/s/p 0:17:30 } +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2384/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.6296268e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66000 samples/s/p 0:17:27 } +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2386/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.6208917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65926 samples/s/p 0:17:24 } +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2388/ 3125], loss: 0.043, per_step_time: 1413ms, lr: 1.6121744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66099 samples/s/p 0:17:21 } +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2390/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 1.603484e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65917 samples/s/p 0:17:19 } +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2392/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.5948176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65617 samples/s/p 0:17:16 } +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2394/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 1.586169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65711 samples/s/p 0:17:13 } +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2396/ 3125], loss: 0.369, per_step_time: 1414ms, lr: 1.5775501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65771 samples/s/p 0:17:10 } +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2398/ 3125], loss: 0.399, per_step_time: 1414ms, lr: 1.5689491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:51,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65626 samples/s/p 0:17:08 } +2024-07-30 05:53:54,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2400/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.560378e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:54,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.66166 samples/s/p 0:17:04 } +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2402/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 1.5518218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65899 samples/s/p 0:17:02 } +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2404/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 1.5432924e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65802 samples/s/p 0:16:59 } +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2406/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 1.5347868e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65712 samples/s/p 0:16:56 } +2024-07-30 05:54:05,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2408/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.5263021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65437 samples/s/p 0:16:54 } +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2410/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 1.5178442e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65684 samples/s/p 0:16:51 } +2024-07-30 05:54:11,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2412/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.509407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:11,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65851 samples/s/p 0:16:48 } +2024-07-30 05:54:14,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2414/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 1.5009999e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:14,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65745 samples/s/p 0:16:45 } +2024-07-30 05:54:17,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2416/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 1.4926076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.66106 samples/s/p 0:16:41 } +2024-07-30 05:54:20,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2418/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 1.4842361e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.65768 samples/s/p 0:16:39 } +2024-07-30 05:54:22,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2420/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4758915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66100 samples/s/p 0:16:36 } +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2422/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.4675706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66035 samples/s/p 0:16:33 } +2024-07-30 05:54:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2424/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4592736e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:28,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66079 samples/s/p 0:16:30 } +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2426/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.4509976e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:31,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.65968 samples/s/p 0:16:28 } +2024-07-30 05:54:34,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2428/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 1.4427512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:34,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66085 samples/s/p 0:16:25 } +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2430/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.4345228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:37,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66165 samples/s/p 0:16:22 } +2024-07-30 05:54:39,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2432/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.4263212e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.65941 samples/s/p 0:16:19 } +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2434/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 1.4181346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66035 samples/s/p 0:16:16 } +2024-07-30 05:54:45,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2436/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4099747e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66044 samples/s/p 0:16:13 } +2024-07-30 05:54:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2438/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.4018386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:48,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65900 samples/s/p 0:16:11 } +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2440/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.3937324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66046 samples/s/p 0:16:08 } +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2442/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.385638e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65877 samples/s/p 0:16:05 } +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2444/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.3775735e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65963 samples/s/p 0:16:02 } +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2446/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.3695359e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:59,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65871 samples/s/p 0:15:59 } +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2448/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 1.3615131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65821 samples/s/p 0:15:57 } +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2450/ 3125], loss: 0.194, per_step_time: 1418ms, lr: 1.3535141e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.63861 samples/s/p 0:15:57 } +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2452/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.345545e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:08,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65959 samples/s/p 0:15:51 } +2024-07-30 05:55:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2454/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 1.3375967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:11,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65896 samples/s/p 0:15:48 } +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2456/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 1.3296693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65734 samples/s/p 0:15:46 } +2024-07-30 05:55:16,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2458/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 1.3217628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:16,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65170 samples/s/p 0:15:44 } +2024-07-30 05:55:19,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2460/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 1.313889e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:19,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66184 samples/s/p 0:15:39 } +2024-07-30 05:55:22,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2462/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 1.3060301e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66044 samples/s/p 0:15:37 } +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2464/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.2981981e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66077 samples/s/p 0:15:34 } +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2466/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 1.290381e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65842 samples/s/p 0:15:31 } +2024-07-30 05:55:31,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2468/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.2825936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:31,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66109 samples/s/p 0:15:28 } +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2470/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.274833e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66017 samples/s/p 0:15:25 } +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2472/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 1.2670934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65535 samples/s/p 0:15:23 } +2024-07-30 05:55:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2474/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 1.2593746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65943 samples/s/p 0:15:20 } +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2476/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 1.2516796e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:42,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65768 samples/s/p 0:15:17 } +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2478/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 1.2440115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65993 samples/s/p 0:15:14 } +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2480/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 1.2363672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65927 samples/s/p 0:15:11 } +2024-07-30 05:55:50,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2482/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.2287408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:50,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66034 samples/s/p 0:15:08 } +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2484/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.2211382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65868 samples/s/p 0:15:06 } +2024-07-30 05:55:56,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2486/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 1.2135625e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:56,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65838 samples/s/p 0:15:03 } +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2488/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 1.2060076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66083 samples/s/p 0:15:00 } +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2490/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 1.1984795e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66111 samples/s/p 0:14:57 } +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2492/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 1.1909723e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65917 samples/s/p 0:14:54 } +2024-07-30 05:56:07,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2494/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 1.18348595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:07,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.66021 samples/s/p 0:14:51 } +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2496/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 1.1760235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65879 samples/s/p 0:14:49 } +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2498/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 1.1685848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65884 samples/s/p 0:14:46 } +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2500/ 3125], loss: 0.334, per_step_time: 1414ms, lr: 1.1611759e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65628 samples/s/p 0:14:43 } +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2502/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 1.153782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.65410 samples/s/p 0:14:41 } +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2504/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 1.14641786e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66039 samples/s/p 0:14:37 } +2024-07-30 05:56:24,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2506/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 1.13907156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:24,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66208 samples/s/p 0:14:34 } +2024-07-30 05:56:27,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2508/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.1317521e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:27,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66123 samples/s/p 0:14:31 } +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2510/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 1.1244505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66030 samples/s/p 0:14:29 } +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2512/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.11717874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:33,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65503 samples/s/p 0:14:27 } +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2514/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.1099249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65989 samples/s/p 0:14:23 } +2024-07-30 05:56:39,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2516/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 1.1027008e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65697 samples/s/p 0:14:21 } +2024-07-30 05:56:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2518/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 1.0954946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:41,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65330 samples/s/p 0:14:18 } +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2520/ 3125], loss: 0.403, per_step_time: 1412ms, lr: 1.0883152e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.66192 samples/s/p 0:14:14 } +2024-07-30 05:56:47,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2522/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.0811567e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:47,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65905 samples/s/p 0:14:12 } +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2524/ 3125], loss: 0.348, per_step_time: 1412ms, lr: 1.074025e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66189 samples/s/p 0:14:09 } +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2526/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.0669142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66145 samples/s/p 0:14:06 } +2024-07-30 05:56:56,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2528/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.0598272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65852 samples/s/p 0:14:04 } +2024-07-30 05:56:58,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2530/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.0527551e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:58,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66165 samples/s/p 0:14:00 } +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2532/ 3125], loss: 0.062, per_step_time: 1413ms, lr: 1.04571576e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:01,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66132 samples/s/p 0:13:57 } +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2534/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 1.0387033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65590 samples/s/p 0:13:55 } +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2536/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 1.0317057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66245 samples/s/p 0:13:52 } +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2538/ 3125], loss: 0.071, per_step_time: 1415ms, lr: 1.0247349e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65155 samples/s/p 0:13:50 } +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2540/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.017788e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65784 samples/s/p 0:13:47 } +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2542/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.0108679e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65482 samples/s/p 0:13:44 } +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2544/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 1.0039687e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65797 samples/s/p 0:13:41 } +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2546/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 9.9709034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.66262 samples/s/p 0:13:37 } +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2548/ 3125], loss: 0.436, per_step_time: 1414ms, lr: 9.902358e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65702 samples/s/p 0:13:35 } +2024-07-30 05:57:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2550/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.834021e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:27,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66110 samples/s/p 0:13:32 } +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2552/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.765982e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.65837 samples/s/p 0:13:30 } +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2554/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.6981225e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:32,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66087 samples/s/p 0:13:26 } +2024-07-30 05:57:35,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2556/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.630531e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66100 samples/s/p 0:13:24 } +2024-07-30 05:57:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2558/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.5631776e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.65998 samples/s/p 0:13:21 } +2024-07-30 05:57:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2560/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.4960626e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.66099 samples/s/p 0:13:18 } +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2562/ 3125], loss: 0.318, per_step_time: 1426ms, lr: 9.429186e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.60950 samples/s/p 0:13:22 } +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2564/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.362459e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.65960 samples/s/p 0:13:12 } +2024-07-30 05:57:49,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2566/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.29603e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:49,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.65995 samples/s/p 0:13:10 } +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2568/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.2298386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65604 samples/s/p 0:13:07 } +2024-07-30 05:57:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2570/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.163886e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.66052 samples/s/p 0:13:04 } +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2572/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 9.098202e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65564 samples/s/p 0:13:02 } +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2574/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.032637e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65809 samples/s/p 0:12:59 } +2024-07-30 05:58:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2576/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 8.9674295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:04,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65799 samples/s/p 0:12:56 } +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2578/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.9024006e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66043 samples/s/p 0:12:53 } +2024-07-30 05:58:09,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2580/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.83764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:09,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66042 samples/s/p 0:12:50 } +2024-07-30 05:58:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2582/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 8.7730584e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:12,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65868 samples/s/p 0:12:47 } +2024-07-30 05:58:15,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2584/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.708715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65672 samples/s/p 0:12:45 } +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2586/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.64467e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66060 samples/s/p 0:12:41 } +2024-07-30 05:58:21,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2588/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.580774e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66024 samples/s/p 0:12:38 } +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2590/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 8.5171756e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65820 samples/s/p 0:12:36 } +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2592/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 8.453816e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66084 samples/s/p 0:12:33 } +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2594/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 8.390635e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65776 samples/s/p 0:12:30 } +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2596/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 8.327722e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65696 samples/s/p 0:12:28 } +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2598/ 3125], loss: 0.081, per_step_time: 1414ms, lr: 8.265048e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65679 samples/s/p 0:12:25 } +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2600/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 8.202642e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66196 samples/s/p 0:12:21 } +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2602/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.1404444e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65912 samples/s/p 0:12:19 } +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2604/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 8.078426e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66295 samples/s/p 0:12:16 } +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2606/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.0167055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:46,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66122 samples/s/p 0:12:13 } +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2608/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 7.955163e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.65892 samples/s/p 0:12:10 } +2024-07-30 05:58:52,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2610/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 7.893949e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:52,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66132 samples/s/p 0:12:07 } +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2612/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.8329144e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:55,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66031 samples/s/p 0:12:05 } +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2614/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.7721474e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:57,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66165 samples/s/p 0:12:02 } +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2616/ 3125], loss: 0.175, per_step_time: 1412ms, lr: 7.7115295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66227 samples/s/p 0:11:59 } +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2618/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.6512094e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65973 samples/s/p 0:11:56 } +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2620/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.591128e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66096 samples/s/p 0:11:53 } +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2622/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 7.5312556e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65991 samples/s/p 0:11:50 } +2024-07-30 05:59:12,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2624/ 3125], loss: 0.343, per_step_time: 1425ms, lr: 7.47165e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:12,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.61294 samples/s/p 0:11:54 } +2024-07-30 05:59:14,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2626/ 3125], loss: 0.095, per_step_time: 1414ms, lr: 7.4122546e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:14,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65766 samples/s/p 0:11:45 } +2024-07-30 05:59:17,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2628/ 3125], loss: 0.128, per_step_time: 1415ms, lr: 7.353127e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:17,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65295 samples/s/p 0:11:43 } +2024-07-30 05:59:20,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2630/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 7.294178e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:20,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66145 samples/s/p 0:11:39 } +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2632/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 7.235497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66024 samples/s/p 0:11:36 } +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2634/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 7.177055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65853 samples/s/p 0:11:34 } +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2636/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.118821e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65928 samples/s/p 0:11:31 } +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2638/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 7.0609154e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65736 samples/s/p 0:11:28 } +2024-07-30 05:59:34,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2640/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 7.003158e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:34,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65799 samples/s/p 0:11:25 } +2024-07-30 05:59:37,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2642/ 3125], loss: 0.435, per_step_time: 1415ms, lr: 6.94561e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:37,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65325 samples/s/p 0:11:23 } +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2644/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 6.8883594e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65832 samples/s/p 0:11:20 } +2024-07-30 05:59:43,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2646/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 6.831318e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66083 samples/s/p 0:11:16 } +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2648/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.774515e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66013 samples/s/p 0:11:14 } +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2650/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.71792e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65973 samples/s/p 0:11:11 } +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2652/ 3125], loss: 0.039, per_step_time: 1413ms, lr: 6.661624e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66103 samples/s/p 0:11:08 } +2024-07-30 05:59:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2654/ 3125], loss: 0.388, per_step_time: 1416ms, lr: 6.605536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:54,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.64828 samples/s/p 0:11:07 } +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2656/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 6.549686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66122 samples/s/p 0:11:02 } +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2658/ 3125], loss: 0.437, per_step_time: 1415ms, lr: 6.494045e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.65320 samples/s/p 0:11:00 } +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2660/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.4386725e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66106 samples/s/p 0:10:57 } +2024-07-30 06:00:05,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2662/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 6.383538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:05,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65936 samples/s/p 0:10:54 } +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2664/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 6.328612e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65971 samples/s/p 0:10:51 } +2024-07-30 06:00:11,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2666/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.273955e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66110 samples/s/p 0:10:48 } +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2668/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 6.2194765e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66175 samples/s/p 0:10:45 } +2024-07-30 06:00:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2670/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.1652656e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:17,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66155 samples/s/p 0:10:42 } +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2672/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.111294e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65815 samples/s/p 0:10:40 } +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2674/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 6.05759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66220 samples/s/p 0:10:37 } +2024-07-30 06:00:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2676/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.0041245e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:25,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66018 samples/s/p 0:10:34 } +2024-07-30 06:00:28,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2678/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 5.950838e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:28,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65782 samples/s/p 0:10:32 } +2024-07-30 06:00:31,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2680/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.89779e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:31,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66128 samples/s/p 0:10:28 } +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2682/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 5.8449803e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65692 samples/s/p 0:10:26 } +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2684/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 5.792439e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65684 samples/s/p 0:10:23 } +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2686/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7401657e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66159 samples/s/p 0:10:20 } +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2688/ 3125], loss: 0.657, per_step_time: 1413ms, lr: 5.6880115e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66024 samples/s/p 0:10:17 } +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2690/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 5.6361852e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:45,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65958 samples/s/p 0:10:14 } +2024-07-30 06:00:48,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2692/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.5845973e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:48,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65737 samples/s/p 0:10:12 } +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2694/ 3125], loss: 0.072, per_step_time: 1415ms, lr: 5.5332183e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:51,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65352 samples/s/p 0:10:09 } +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2696/ 3125], loss: 0.481, per_step_time: 1414ms, lr: 5.4820475e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65441 samples/s/p 0:10:06 } +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2698/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 5.4311453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.66057 samples/s/p 0:10:03 } +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2700/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.3805113e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66128 samples/s/p 0:10:00 } +2024-07-30 06:01:02,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2702/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.3300855e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:02,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65907 samples/s/p 0:09:57 } +2024-07-30 06:01:05,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2704/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 5.2798686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:05,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65921 samples/s/p 0:09:55 } +2024-07-30 06:01:08,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2706/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.22992e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65976 samples/s/p 0:09:52 } +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2708/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 5.1802097e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65670 samples/s/p 0:09:49 } +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.1307378e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65893 samples/s/p 0:09:46 } +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2712/ 3125], loss: 0.024, per_step_time: 1413ms, lr: 5.081445e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65789 samples/s/p 0:09:43 } +2024-07-30 06:01:19,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2714/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 5.03242e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:19,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65408 samples/s/p 0:09:41 } +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2716/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 4.9836633e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65880 samples/s/p 0:09:38 } +2024-07-30 06:01:25,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2718/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 4.9351453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:25,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65572 samples/s/p 0:09:35 } +2024-07-30 06:01:28,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2720/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.886836e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:28,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65998 samples/s/p 0:09:32 } +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2722/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 4.8387644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65810 samples/s/p 0:09:29 } +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2724/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.790902e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65970 samples/s/p 0:09:26 } +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2726/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.7433375e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.66126 samples/s/p 0:09:23 } +2024-07-30 06:01:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2728/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.6959517e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65819 samples/s/p 0:09:21 } +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2730/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 4.6488342e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66009 samples/s/p 0:09:18 } +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2732/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 4.601985e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65918 samples/s/p 0:09:15 } +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2734/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 4.5553147e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65988 samples/s/p 0:09:12 } +2024-07-30 06:01:50,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2736/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.5088825e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:50,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66007 samples/s/p 0:09:09 } +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2738/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 4.462689e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66031 samples/s/p 0:09:06 } +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2740/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 4.416764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:56,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66103 samples/s/p 0:09:04 } +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2742/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.3710767e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66023 samples/s/p 0:09:01 } +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2744/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.3255984e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66078 samples/s/p 0:08:58 } +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2746/ 3125], loss: 0.068, per_step_time: 1412ms, lr: 4.2803883e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.66230 samples/s/p 0:08:55 } +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2748/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 4.2353868e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.65669 samples/s/p 0:08:53 } +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2750/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.1906535e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65916 samples/s/p 0:08:50 } +2024-07-30 06:02:13,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2752/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 4.1461288e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:13,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65302 samples/s/p 0:08:47 } +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2754/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 4.1018424e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.66023 samples/s/p 0:08:44 } +2024-07-30 06:02:19,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2756/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 4.0577948e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:19,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65420 samples/s/p 0:08:42 } +2024-07-30 06:02:22,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2758/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 4.014015e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:22,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66124 samples/s/p 0:08:38 } +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2760/ 3125], loss: 0.477, per_step_time: 1414ms, lr: 3.9704442e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65577 samples/s/p 0:08:36 } +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2762/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 3.9270518e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:27,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66113 samples/s/p 0:08:32 } +2024-07-30 06:02:30,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2764/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.8839875e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:30,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66133 samples/s/p 0:08:30 } +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2766/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.841102e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66169 samples/s/p 0:08:27 } +2024-07-30 06:02:36,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2768/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 3.7985146e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:36,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66082 samples/s/p 0:08:24 } +2024-07-30 06:02:39,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2770/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.7561357e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:39,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66109 samples/s/p 0:08:21 } +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2772/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.7139653e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66091 samples/s/p 0:08:18 } +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2774/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 3.6720333e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66089 samples/s/p 0:08:16 } +2024-07-30 06:02:47,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2776/ 3125], loss: 0.407, per_step_time: 1412ms, lr: 3.63034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:47,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66252 samples/s/p 0:08:13 } +2024-07-30 06:02:50,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2778/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 3.5889446e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:50,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.65965 samples/s/p 0:08:10 } +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2780/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5476685e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66161 samples/s/p 0:08:07 } +2024-07-30 06:02:56,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2782/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 3.5067497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:56,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.65699 samples/s/p 0:08:05 } +2024-07-30 06:02:58,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2784/ 3125], loss: 0.311, per_step_time: 1415ms, lr: 3.46601e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:58,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.64986 samples/s/p 0:08:02 } +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2786/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.4255386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65949 samples/s/p 0:07:59 } +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2788/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 3.3852753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65859 samples/s/p 0:07:56 } +2024-07-30 06:03:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2790/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 3.3452807e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:07,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65697 samples/s/p 0:07:53 } +2024-07-30 06:03:10,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2792/ 3125], loss: 0.171, per_step_time: 1414ms, lr: 3.3054945e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65719 samples/s/p 0:07:50 } +2024-07-30 06:03:13,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2794/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.265947e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:13,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65964 samples/s/p 0:07:47 } +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2796/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 3.226608e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65477 samples/s/p 0:07:45 } +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2798/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 3.187567e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65723 samples/s/p 0:07:42 } +2024-07-30 06:03:21,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2800/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 3.1487644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65838 samples/s/p 0:07:39 } +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2802/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 3.1101703e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65653 samples/s/p 0:07:36 } +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2804/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 3.071755e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66070 samples/s/p 0:07:33 } +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2806/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 3.033668e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65903 samples/s/p 0:07:30 } +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2808/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 2.995759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65704 samples/s/p 0:07:28 } +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2810/ 3125], loss: 0.115, per_step_time: 1413ms, lr: 2.9581486e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66170 samples/s/p 0:07:25 } +2024-07-30 06:03:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2812/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 2.920717e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66063 samples/s/p 0:07:22 } +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2814/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 2.8835236e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66145 samples/s/p 0:07:19 } +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2816/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 2.8466582e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66241 samples/s/p 0:07:16 } +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2818/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 2.8099416e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.65935 samples/s/p 0:07:13 } +2024-07-30 06:03:49,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2820/ 3125], loss: 0.441, per_step_time: 1412ms, lr: 2.773434e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:49,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66192 samples/s/p 0:07:10 } +2024-07-30 06:03:52,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2822/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.7372538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:52,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65894 samples/s/p 0:07:08 } +2024-07-30 06:03:55,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2824/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.7012526e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:55,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65933 samples/s/p 0:07:05 } +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2826/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 2.6655197e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65898 samples/s/p 0:07:02 } +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2828/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 2.6299952e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65455 samples/s/p 0:07:00 } +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2830/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.5947392e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66168 samples/s/p 0:06:56 } +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2832/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.5597213e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66059 samples/s/p 0:06:54 } +2024-07-30 06:04:09,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2834/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.5248527e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:09,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66076 samples/s/p 0:06:51 } +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2836/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 2.4903715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65737 samples/s/p 0:06:48 } +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2838/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.4560093e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65905 samples/s/p 0:06:45 } +2024-07-30 06:04:18,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2840/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 2.4219453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:18,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65656 samples/s/p 0:06:43 } +2024-07-30 06:04:21,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2842/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 2.3881196e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65890 samples/s/p 0:06:40 } +2024-07-30 06:04:23,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2844/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 2.3544729e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:23,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66128 samples/s/p 0:06:37 } +2024-07-30 06:04:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2846/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3211241e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65910 samples/s/p 0:06:34 } +2024-07-30 06:04:29,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2848/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.2880137e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:29,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65781 samples/s/p 0:06:31 } +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2850/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.255082e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65984 samples/s/p 0:06:28 } +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2852/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2224187e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65802 samples/s/p 0:06:26 } +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2854/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.1899938e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65506 samples/s/p 0:06:23 } +2024-07-30 06:04:40,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2856/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.1578073e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:40,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65824 samples/s/p 0:06:20 } +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2858/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 2.125889e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:43,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65604 samples/s/p 0:06:17 } +2024-07-30 06:04:46,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2860/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 2.0941794e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:46,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65820 samples/s/p 0:06:14 } +2024-07-30 06:04:49,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2862/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 2.0627379e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:49,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65897 samples/s/p 0:06:11 } +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2864/ 3125], loss: 0.192, per_step_time: 1419ms, lr: 2.0314753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.63429 samples/s/p 0:06:10 } +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2866/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.0005107e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65789 samples/s/p 0:06:06 } +2024-07-30 06:04:57,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2868/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.9697248e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65788 samples/s/p 0:06:03 } +2024-07-30 06:05:00,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2870/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 1.9392072e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:00,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65963 samples/s/p 0:06:00 } +2024-07-30 06:05:03,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2872/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 1.908958e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:03,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65961 samples/s/p 0:05:57 } +2024-07-30 06:05:06,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2874/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.8788874e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:06,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66053 samples/s/p 0:05:54 } +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2876/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 1.849085e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65994 samples/s/p 0:05:51 } +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2878/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 1.819521e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.65714 samples/s/p 0:05:49 } +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2880/ 3125], loss: 0.092, per_step_time: 1412ms, lr: 1.7902254e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66179 samples/s/p 0:05:46 } +2024-07-30 06:05:17,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2882/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 1.7611086e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:17,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66001 samples/s/p 0:05:43 } +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2884/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.73226e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66001 samples/s/p 0:05:40 } +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2886/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.7036497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65948 samples/s/p 0:05:37 } +2024-07-30 06:05:26,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2888/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.6752184e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65677 samples/s/p 0:05:35 } +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2890/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.6471148e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66025 samples/s/p 0:05:32 } +2024-07-30 06:05:31,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2892/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 1.6192198e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:31,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65717 samples/s/p 0:05:29 } +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2894/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.5915631e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65945 samples/s/p 0:05:26 } +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2896/ 3125], loss: 0.167, per_step_time: 1415ms, lr: 1.5641152e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65297 samples/s/p 0:05:24 } +2024-07-30 06:05:40,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2898/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.5369654e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:40,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66056 samples/s/p 0:05:20 } +2024-07-30 06:05:43,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2900/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 1.5099644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:43,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65977 samples/s/p 0:05:18 } +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2902/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4832615e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66033 samples/s/p 0:05:15 } +2024-07-30 06:05:48,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2904/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 1.4568269e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:48,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65925 samples/s/p 0:05:12 } +2024-07-30 06:05:51,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2906/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 1.4305412e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:51,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65753 samples/s/p 0:05:09 } +2024-07-30 06:05:54,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2908/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.4045536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65694 samples/s/p 0:05:06 } +2024-07-30 06:05:57,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2910/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 1.3787746e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:57,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65805 samples/s/p 0:05:03 } +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2912/ 3125], loss: 0.152, per_step_time: 1424ms, lr: 1.35329365e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.61430 samples/s/p 0:05:03 } +2024-07-30 06:06:03,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2914/ 3125], loss: 0.210, per_step_time: 1412ms, lr: 1.3279915e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:03,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.66185 samples/s/p 0:04:58 } +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2916/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.3029575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:05,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.66008 samples/s/p 0:04:55 } +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2918/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.2781322e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65897 samples/s/p 0:04:52 } +2024-07-30 06:06:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2920/ 3125], loss: 0.135, per_step_time: 1420ms, lr: 1.253575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:11,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.63357 samples/s/p 0:04:51 } +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2922/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 1.2292862e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65818 samples/s/p 0:04:47 } +2024-07-30 06:06:17,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2924/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.20517605e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65994 samples/s/p 0:04:44 } +2024-07-30 06:06:20,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2926/ 3125], loss: 0.231, per_step_time: 1415ms, lr: 1.1813044e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:20,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65174 samples/s/p 0:04:41 } +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2928/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.1576712e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65782 samples/s/p 0:04:38 } +2024-07-30 06:06:25,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2930/ 3125], loss: 0.466, per_step_time: 1413ms, lr: 1.1342763e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:25,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66045 samples/s/p 0:04:35 } +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2932/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.1111796e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:28,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66072 samples/s/p 0:04:32 } +2024-07-30 06:06:31,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2934/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.0882616e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:31,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65680 samples/s/p 0:04:30 } +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2936/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.0656118e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65881 samples/s/p 0:04:27 } +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2938/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.0431707e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65925 samples/s/p 0:04:24 } +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2940/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 1.0209978e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.66156 samples/s/p 0:04:21 } +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2942/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 9.990334e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65533 samples/s/p 0:04:18 } +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2944/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 9.773076e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:45,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65814 samples/s/p 0:04:15 } +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2946/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.558499e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65991 samples/s/p 0:04:13 } +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2948/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.346604e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65534 samples/s/p 0:04:10 } +2024-07-30 06:06:54,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2950/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 9.136498e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:54,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.66216 samples/s/p 0:04:07 } +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2952/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 8.9284775e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65887 samples/s/p 0:04:04 } +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2954/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 8.723438e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65634 samples/s/p 0:04:01 } +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2956/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.520781e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65967 samples/s/p 0:03:58 } +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2958/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 8.320212e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65505 samples/s/p 0:03:56 } +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2960/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 8.122623e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65448 samples/s/p 0:03:53 } +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2962/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.926523e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66089 samples/s/p 0:03:50 } +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2964/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 7.733404e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66151 samples/s/p 0:03:47 } +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2966/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 7.542371e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66111 samples/s/p 0:03:44 } +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2968/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 7.354021e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65974 samples/s/p 0:03:41 } +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2970/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 7.167458e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65685 samples/s/p 0:03:39 } +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2972/ 3125], loss: 0.431, per_step_time: 1414ms, lr: 6.983876e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65743 samples/s/p 0:03:36 } +2024-07-30 06:07:28,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2974/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.802976e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:28,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65871 samples/s/p 0:03:33 } +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2976/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 6.623864e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65980 samples/s/p 0:03:30 } +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2978/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 6.447136e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65964 samples/s/p 0:03:27 } +2024-07-30 06:07:36,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2980/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.2727925e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:36,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65992 samples/s/p 0:03:24 } +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2982/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 6.101131e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:39,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66001 samples/s/p 0:03:22 } +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2984/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 5.931854e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66027 samples/s/p 0:03:19 } +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2986/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.764663e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65952 samples/s/p 0:03:16 } +2024-07-30 06:07:48,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2988/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 5.600452e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:48,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66014 samples/s/p 0:03:13 } +2024-07-30 06:07:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2990/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 5.4374336e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65763 samples/s/p 0:03:10 } +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2992/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 5.277693e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65907 samples/s/p 0:03:08 } +2024-07-30 06:07:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2994/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 5.120039e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65907 samples/s/p 0:03:05 } +2024-07-30 06:07:59,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2996/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.965365e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:59,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65949 samples/s/p 0:03:02 } +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2998/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 4.812181e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:02,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65751 samples/s/p 0:02:59 } +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3000/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 4.6625734e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65810 samples/s/p 0:02:56 } +2024-07-30 06:08:07,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3002/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 4.5138595e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:07,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65835 samples/s/p 0:02:53 } +2024-07-30 06:08:10,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3004/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 4.3684243e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:10,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65386 samples/s/p 0:02:51 } +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3006/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 4.225373e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65843 samples/s/p 0:02:48 } +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3008/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 4.0844084e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65703 samples/s/p 0:02:45 } +2024-07-30 06:08:19,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3010/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 3.946125e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:19,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66010 samples/s/p 0:02:42 } +2024-07-30 06:08:22,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3012/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.809929e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:22,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66154 samples/s/p 0:02:39 } +2024-07-30 06:08:24,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3014/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.6761163e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:24,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65908 samples/s/p 0:02:36 } +2024-07-30 06:08:27,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3016/ 3125], loss: 0.283, per_step_time: 1412ms, lr: 3.544986e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:27,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66206 samples/s/p 0:02:34 } +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3018/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4165382e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:30,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66030 samples/s/p 0:02:31 } +2024-07-30 06:08:33,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3020/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 3.2895802e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:33,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66186 samples/s/p 0:02:28 } +2024-07-30 06:08:36,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3022/ 3125], loss: 0.099, per_step_time: 1415ms, lr: 3.1656027e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:36,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65220 samples/s/p 0:02:25 } +2024-07-30 06:08:39,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3024/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 3.043711e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66029 samples/s/p 0:02:22 } +2024-07-30 06:08:41,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3026/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 2.9245018e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:41,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66098 samples/s/p 0:02:19 } +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3028/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 2.8073788e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65615 samples/s/p 0:02:17 } +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3030/ 3125], loss: 0.028, per_step_time: 1413ms, lr: 2.6926397e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65935 samples/s/p 0:02:14 } +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3032/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 2.580881e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65911 samples/s/p 0:02:11 } +2024-07-30 06:08:53,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3034/ 3125], loss: 0.190, per_step_time: 1416ms, lr: 2.4709106e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:53,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.64704 samples/s/p 0:02:08 } +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3036/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 2.3639202e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65803 samples/s/p 0:02:05 } +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3038/ 3125], loss: 0.532, per_step_time: 1414ms, lr: 2.2587179e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65403 samples/s/p 0:02:03 } +2024-07-30 06:09:01,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3040/ 3125], loss: 0.358, per_step_time: 1412ms, lr: 2.155602e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:01,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.66223 samples/s/p 0:02:00 } +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3042/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 2.0557642e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65860 samples/s/p 0:01:57 } +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3044/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.9577144e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65542 samples/s/p 0:01:54 } +2024-07-30 06:09:10,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3046/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.8620491e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:10,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65845 samples/s/p 0:01:51 } +2024-07-30 06:09:13,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3048/ 3125], loss: 0.417, per_step_time: 1417ms, lr: 1.7693639e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:13,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.64520 samples/s/p 0:01:49 } +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3050/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6784667e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65879 samples/s/p 0:01:46 } +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3052/ 3125], loss: 0.300, per_step_time: 1415ms, lr: 1.5902519e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65257 samples/s/p 0:01:43 } +2024-07-30 06:09:21,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3054/ 3125], loss: 0.165, per_step_time: 1414ms, lr: 1.5044211e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:21,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65723 samples/s/p 0:01:40 } +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3056/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 1.4206767e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66204 samples/s/p 0:01:37 } +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3058/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.3396143e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65868 samples/s/p 0:01:34 } +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3060/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 1.2612342e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66255 samples/s/p 0:01:31 } +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3062/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 1.1846423e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65408 samples/s/p 0:01:29 } +2024-07-30 06:09:35,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3064/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 1.1107325e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:35,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66108 samples/s/p 0:01:26 } +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3066/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 1.038909e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66189 samples/s/p 0:01:23 } +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3068/ 3125], loss: 0.279, per_step_time: 1414ms, lr: 9.694695e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65749 samples/s/p 0:01:20 } +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3070/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.0271235e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66085 samples/s/p 0:01:17 } +2024-07-30 06:09:47,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3072/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.380413e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:47,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65876 samples/s/p 0:01:14 } +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3074/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 7.7605244e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66028 samples/s/p 0:01:12 } +2024-07-30 06:09:52,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3076/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 7.161498e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66204 samples/s/p 0:01:09 } +2024-07-30 06:09:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3078/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 6.595254e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65739 samples/s/p 0:01:06 } +2024-07-30 06:09:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3080/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 6.043911e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65574 samples/s/p 0:01:03 } +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3082/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.5164096e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65777 samples/s/p 0:01:00 } +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3084/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 5.0157306e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65370 samples/s/p 0:00:58 } +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3086/ 3125], loss: 0.515, per_step_time: 1419ms, lr: 4.5418738e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.63755 samples/s/p 0:00:55 } +2024-07-30 06:10:09,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3088/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 4.0858983e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65056 samples/s/p 0:00:52 } +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3090/ 3125], loss: 0.113, per_step_time: 1414ms, lr: 3.6537645e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65622 samples/s/p 0:00:49 } +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3092/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 3.2514333e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65388 samples/s/p 0:00:46 } +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3094/ 3125], loss: 0.468, per_step_time: 1413ms, lr: 2.8669833e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66044 samples/s/p 0:00:43 } +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3096/ 3125], loss: 0.111, per_step_time: 1412ms, lr: 2.5063754e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66179 samples/s/p 0:00:40 } +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3098/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.1785497e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65991 samples/s/p 0:00:38 } +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3100/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.8656253e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65953 samples/s/p 0:00:35 } +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3102/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.5825033e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.65905 samples/s/p 0:00:32 } +2024-07-30 06:10:32,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3104/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.3172625e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66112 samples/s/p 0:00:29 } +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3106/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 1.0818243e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66255 samples/s/p 0:00:26 } +2024-07-30 06:10:38,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3108/ 3125], loss: 0.070, per_step_time: 1413ms, lr: 8.612871e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66037 samples/s/p 0:00:24 } +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3110/ 3125], loss: 0.126, per_step_time: 1425ms, lr: 6.705522e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.61086 samples/s/p 0:00:21 } +2024-07-30 06:10:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3112/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 5.0663945e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65913 samples/s/p 0:00:18 } +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3114/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 3.606081e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65557 samples/s/p 0:00:15 } +2024-07-30 06:10:49,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3116/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 2.3841857e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:49,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65297 samples/s/p 0:00:12 } +2024-07-30 06:10:52,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3118/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.4603138e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:52,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65994 samples/s/p 0:00:09 } +2024-07-30 06:10:55,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3120/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.45058e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:55,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65803 samples/s/p 0:00:07 } +2024-07-30 06:10:57,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3122/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 2.682209e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65682 samples/s/p 0:00:04 } +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3124/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 2.9802322e-13, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65811 samples/s/p 0:00:01 } +2024-07-30 06:11:00,843 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 06:11:33,108 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_2.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_2.log" new file mode 100644 index 00000000..155d031c --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_2.log" @@ -0,0 +1,10017 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:07:40.889.599 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:07:41.890.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:07:44.890.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:07:47.890.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:07:47.891.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 2 rank id: 2 +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:08:12.330.489 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:08:12.331.103 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(978993,ffffa1546010,python):2024-07-30-02:08:14.444.181 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-30 02:08:14,447 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_2.ckpt' +2024-07-30 02:08:14,481 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-30 02:08:14,481 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-30 02:08:14,481 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-30 02:08:14,482 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-30 02:08:14,482 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/research/output' +2024-07-30 02:08:14,483 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-30 02:08:14,483 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. +2024-07-30 02:08:14,483 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-30 02:08:14,484 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-30 02:08:14,485 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-30 02:08:14,486 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:3125 +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:3, sink_size:2 +2024-07-30 02:08:14,496 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:3125 +2024-07-30 02:08:14,497 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-30 02:08:14,497 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. +2024-07-30 02:08:14,498 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:08:14.500.419 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:08:14.503.027 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-30 02:08:14,608 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:08:14.610.157 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:08:14.610.288 [mindspore/common/parameter.py:806] This interface may be deleted in the future. +2024-07-30 02:08:14,629 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,650 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,670 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,690 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,710 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,731 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,751 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,772 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,793 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:15,253 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,443 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,466 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-30 02:08:15,466 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... +2024-07-30 02:08:15,466 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-30 02:08:15,466 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-30 02:08:15,472 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-30 02:08:15,476 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + "model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + "model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + "model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-30 02:08:15,573 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... +2024-07-30 02:08:15,573 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-30 02:08:15,579 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-30 02:08:15,581 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-30 02:08:15,582 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-30 02:08:15,583 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:08.296.015 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.489.424 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.490.416 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.490.945 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.674.786 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.719.662 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.759.017 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:13.908.812 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:14.496.062 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.705.32 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.631.485 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.632.278 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.632.736 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.784.248 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.826.200 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:15.867.395 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:16.222.32 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:16.594.410 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.162.863 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.746.711 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.747.471 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.747.900 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.902.058 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.949.612 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:17.991.061 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:18.145.384 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:18.730.408 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:19.302.036 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:19.870.322 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:19.871.154 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:19.871.603 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:20.370.90 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:20.806.67 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:20.121.027 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:20.280.381 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:20.846.460 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:21.444.435 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.703.70 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.712.01 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.716.29 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.233.249 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.271.006 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.362.085 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:22.522.673 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:23.106.167 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:23.664.457 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.226.769 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.227.789 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.228.307 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.393.178 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.432.830 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.473.996 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:24.647.141 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:25.216.406 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:25.818.492 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.376.283 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.377.151 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.377.624 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.544.389 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.615.412 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.702.152 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:26.880.276 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:27.499.703 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:28.128.812 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:28.768.703 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:28.769.785 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:28.770.403 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:28.950.104 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:29.616.18 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:29.116.522 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:29.292.860 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:29.896.317 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:30.475.173 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.416.32 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.430.28 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.435.35 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.214.639 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.262.329 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.310.397 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:31.488.121 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:32.530.91 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:32.641.881 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.202.834 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.203.653 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.204.135 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.371.970 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.433.449 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.485.132 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:33.756.263 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:34.331.422 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:34.944.613 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.547.016 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.547.829 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.548.294 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.792.321 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.842.290 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:35.916.485 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:36.929.16 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:36.700.852 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:37.304.009 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:37.878.781 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:37.879.841 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:37.880.315 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:38.564.98 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:38.107.789 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:38.160.282 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:38.344.165 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:38.912.638 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:39.475.994 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.915.75 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.922.70 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.929.13 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.267.123 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.318.044 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.369.620 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:40.571.462 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:41.284.253 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.118.992 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.675.846 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.676.642 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.677.077 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.896.809 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:42.947.167 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:43.111.7 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:43.191.022 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:43.789.068 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:44.404.792 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:44.960.501 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:44.961.368 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:44.961.833 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:45.127.846 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:45.172.107 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:45.215.797 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:45.391.319 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:45.969.874 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:46.564.101 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.154.469 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.155.309 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.155.773 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.325.289 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.372.765 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.420.310 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:47.588.092 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:48.155.644 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:48.725.607 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.305.498 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.306.313 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.306.759 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.471.759 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.520.549 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.568.383 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:49.824.411 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:50.424.088 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.346.4 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.617.131 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.617.910 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.618.355 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.829.487 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.880.253 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:51.938.373 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:52.152.767 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:52.766.719 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:53.392.596 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:53.974.014 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:53.974.935 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:53.975.370 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:54.183.487 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:54.233.393 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:54.280.885 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:54.466.746 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:55.571.17 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:55.627.489 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.200.844 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.201.624 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.202.057 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.424.490 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.474.104 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.524.145 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:56.693.667 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:57.294.032 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:57.864.835 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.467.303 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.468.048 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.468.523 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.658.957 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.732.669 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.783.092 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:58.996.337 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:10:59.609.581 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:00.631.308 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.198.861 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.199.814 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.200.253 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.377.896 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.426.477 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.475.757 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:01.663.017 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:02.242.897 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:02.830.192 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.428.778 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.429.595 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.430.029 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.615.188 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.664.798 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.713.243 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:03.906.849 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:04.490.341 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.793.11 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.715.001 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.715.785 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.716.217 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.894.020 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.944.057 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:05.989.651 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:06.168.114 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:07.142.365 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:07.710.464 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.345.469 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.346.383 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.346.894 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.559.729 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.614.791 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.671.124 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:08.945.919 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:09.523.027 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.101.663 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.721.859 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.722.775 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.723.244 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.898.019 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:10.950.330 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:11.190. [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:11.184.974 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:11.792.512 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:12.519.495 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.113.529 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.114.311 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.114.758 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.289.107 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.338.810 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.387.231 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:13.572.295 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:14.164.779 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:14.930.445 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.574.064 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.574.974 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.575.500 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.754.417 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.807.791 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:15.874.731 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:16.495.67 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:16.658.668 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:17.222.021 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:17.846.982 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:17.847.718 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:17.848.145 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:18.609.55 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:18.111.223 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:18.173.637 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:18.352.992 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:18.984.416 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:19.560.099 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.119.904 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.120.859 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.121.305 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.296.897 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.344.952 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.394.614 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:20.564.355 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:21.135.180 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:21.743.246 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.316.203 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.316.958 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.317.426 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.490.930 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.540.827 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.588.612 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:22.771.206 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:23.375.618 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:23.979.866 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.599.654 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.600.443 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.600.904 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.801.141 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.851.501 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:24.899.166 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:25.860.75 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:25.887.542 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:26.461.136 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:27.754.56 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:27.762.44 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:56.107.485 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:11:56.111.949 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:03.294.165 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:03.298.052 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:10.401.977 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:10.405.867 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:17.600.214 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:17.604.063 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:24.720.596 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:24.724.447 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:31.760.926 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:31.764.888 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:38.850.726 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:38.854.630 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:46.238.46 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:46.276.23 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:53.416.505 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:12:53.420.602 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:00.553.337 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:00.557.136 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:07.697.639 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:07.701.688 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:14.849.920 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:14.853.758 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:22.156.647 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:22.160.599 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:29.480.176 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:29.484.045 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:36.564.650 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:36.568.726 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:43.633.258 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:43.637.138 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:50.663.834 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:50.667.776 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:57.691.875 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:13:57.695.909 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:04.805.910 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:04.809.886 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:11.858.189 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:11.862.456 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:18.937.711 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:18.941.708 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:26.144.25 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:26.183.83 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:33.647.36 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:33.689.17 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:40.197.856 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:40.201.750 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:47.348.194 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:47.352.332 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:54.468.039 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:14:54.471.993 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:01.542.963 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:01.546.938 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:08.568.854 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:08.572.905 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:15.641.774 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:15.645.771 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:22.689.901 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:22.693.820 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:29.848.015 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:29.852.211 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:37.108.07 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:37.147.59 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:15:44.852.14 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:16:02.680.574 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:16:02.681.031 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-30 02:16:02,681 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-30 02:16:02,682 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO - .........Starting Training Model.......... +2024-07-30 02:16:02,682 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:16:02.683.504 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'step_begin', 'step_end', 'epoch_begin', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(978993:281473388404752,MainProcess):2024-07-30-02:16:02.683.641 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'step_end', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.812.109 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.812.886 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.813.576 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.814.254 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.814.925 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.815.599 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.816.297 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.816.989 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.817.668 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.818.340 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.819.015 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.819.682 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.820.346 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.821.017 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.821.685 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.822.338 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.823.005 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.823.654 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.824.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.824.987 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.825.656 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.826.312 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.826.980 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.827.637 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.828.295 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.828.952 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.829.612 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.830.258 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.830.921 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.831.553 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.832.211 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.832.893 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.833.358 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.834.094 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.834.836 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.835.572 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.836.317 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.837.077 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.837.837 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.838.579 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.839.328 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.840.077 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.840.842 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.841.576 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.842.287 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.843.002 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.843.727 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.844.422 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.845.146 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.845.878 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.846.585 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.847.301 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.848.004 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.848.717 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.849.435 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.850.129 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.850.838 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.851.544 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.852.244 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.852.965 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.853.646 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.854.304 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.854.956 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:30.855.570 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(978993,ffffa1546010,python):2024-07-30-02:16:33.375.367 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. +- \ | 2024-07-30 02:26:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2/ 3125], loss: 1.392, per_step_time: 307388ms, lr: 3.558719e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:19,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02603 samples/s/p 33 days, 8:19:08 } +2024-07-30 02:26:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 4/ 3125], loss: 1.327, per_step_time: 1473ms, lr: 1.0676156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.42763 samples/s/p 3:50:12 } +2024-07-30 02:26:26,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 6/ 3125], loss: 1.193, per_step_time: 1413ms, lr: 1.7793593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.66138 samples/s/p 3:40:39 } +2024-07-30 02:26:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 8/ 3125], loss: 1.399, per_step_time: 1415ms, lr: 2.4911031e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:28,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65002 samples/s/p 3:41:02 } +2024-07-30 02:26:31,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 10/ 3125], loss: 1.360, per_step_time: 1416ms, lr: 3.202847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.64722 samples/s/p 3:41:06 } +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 12/ 3125], loss: 1.379, per_step_time: 1414ms, lr: 3.9145905e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65752 samples/s/p 3:40:39 } +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 14/ 3125], loss: 1.350, per_step_time: 1413ms, lr: 4.6263344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65808 samples/s/p 3:40:35 } +2024-07-30 02:26:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 16/ 3125], loss: 1.343, per_step_time: 1413ms, lr: 5.3380785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:40,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.66001 samples/s/p 3:40:28 } +2024-07-30 02:26:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 18/ 3125], loss: 1.049, per_step_time: 1413ms, lr: 6.049822e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:43,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65876 samples/s/p 3:40:28 } +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 20/ 3125], loss: 1.286, per_step_time: 1413ms, lr: 6.7615656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65873 samples/s/p 3:40:25 } +2024-07-30 02:26:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 22/ 3125], loss: 1.170, per_step_time: 1413ms, lr: 7.473309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65864 samples/s/p 3:40:22 } +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 24/ 3125], loss: 1.197, per_step_time: 1413ms, lr: 8.185053e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65987 samples/s/p 3:40:17 } +2024-07-30 02:26:54,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 26/ 3125], loss: 1.367, per_step_time: 1413ms, lr: 8.896797e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:54,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65864 samples/s/p 3:40:17 } +2024-07-30 02:26:57,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 28/ 3125], loss: 1.430, per_step_time: 1414ms, lr: 9.608541e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65767 samples/s/p 3:40:16 } +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 30/ 3125], loss: 1.447, per_step_time: 1412ms, lr: 1.0320284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66214 samples/s/p 3:40:03 } +2024-07-30 02:27:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 32/ 3125], loss: 1.653, per_step_time: 1415ms, lr: 1.1032029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:02,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65222 samples/s/p 3:40:23 } +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 34/ 3125], loss: 1.188, per_step_time: 1424ms, lr: 1.1743772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.61641 samples/s/p 3:41:45 } +2024-07-30 02:27:08,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 36/ 3125], loss: 1.306, per_step_time: 1414ms, lr: 1.2455515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65568 samples/s/p 3:40:10 } +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 38/ 3125], loss: 1.332, per_step_time: 1413ms, lr: 1.3167258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.66006 samples/s/p 3:39:57 } +2024-07-30 02:27:14,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 40/ 3125], loss: 1.375, per_step_time: 1416ms, lr: 1.3879004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.64927 samples/s/p 3:40:19 } +2024-07-30 02:27:17,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 42/ 3125], loss: 1.420, per_step_time: 1413ms, lr: 1.4590747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:17,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65917 samples/s/p 3:39:53 } +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 44/ 3125], loss: 1.437, per_step_time: 1412ms, lr: 1.530249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66191 samples/s/p 3:39:44 } +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 46/ 3125], loss: 1.287, per_step_time: 1413ms, lr: 1.6014234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66121 samples/s/p 3:39:43 } +2024-07-30 02:27:25,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 48/ 3125], loss: 1.380, per_step_time: 1414ms, lr: 1.6725978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:25,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65428 samples/s/p 3:39:56 } +2024-07-30 02:27:28,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 50/ 3125], loss: 1.100, per_step_time: 1413ms, lr: 1.7437721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65907 samples/s/p 3:39:42 } +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 52/ 3125], loss: 1.361, per_step_time: 1413ms, lr: 1.8149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:31,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65776 samples/s/p 3:39:42 } +2024-07-30 02:27:34,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 54/ 3125], loss: 1.508, per_step_time: 1413ms, lr: 1.886121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:34,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65971 samples/s/p 3:39:35 } +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 56/ 3125], loss: 1.341, per_step_time: 1413ms, lr: 1.9572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66017 samples/s/p 3:39:31 } +2024-07-30 02:27:39,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 58/ 3125], loss: 1.275, per_step_time: 1413ms, lr: 2.0284697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:39,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66074 samples/s/p 3:39:27 } +2024-07-30 02:27:42,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 60/ 3125], loss: 1.126, per_step_time: 1414ms, lr: 2.099644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65509 samples/s/p 3:39:37 } +2024-07-30 02:27:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 62/ 3125], loss: 1.619, per_step_time: 1414ms, lr: 2.1708183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65732 samples/s/p 3:39:29 } +2024-07-30 02:27:48,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 64/ 3125], loss: 1.251, per_step_time: 1415ms, lr: 2.2419927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:48,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65098 samples/s/p 3:39:41 } +2024-07-30 02:27:51,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 66/ 3125], loss: 1.324, per_step_time: 1413ms, lr: 2.3131672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:51,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65923 samples/s/p 3:39:19 } +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 68/ 3125], loss: 1.160, per_step_time: 1413ms, lr: 2.3843415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65790 samples/s/p 3:39:19 } +2024-07-30 02:27:56,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 70/ 3125], loss: 1.056, per_step_time: 1413ms, lr: 2.4555159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65810 samples/s/p 3:39:16 } +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 72/ 3125], loss: 1.486, per_step_time: 1415ms, lr: 2.5266902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65284 samples/s/p 3:39:25 } +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 74/ 3125], loss: 1.359, per_step_time: 1414ms, lr: 2.5978647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65613 samples/s/p 3:39:15 } +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 76/ 3125], loss: 1.356, per_step_time: 1415ms, lr: 2.669039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65151 samples/s/p 3:39:23 } +2024-07-30 02:28:08,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 78/ 3125], loss: 1.349, per_step_time: 1413ms, lr: 2.7402134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:08,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65808 samples/s/p 3:39:05 } +2024-07-30 02:28:10,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 80/ 3125], loss: 1.630, per_step_time: 1413ms, lr: 2.8113877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:10,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66110 samples/s/p 3:38:55 } +2024-07-30 02:28:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 82/ 3125], loss: 1.549, per_step_time: 1413ms, lr: 2.8825623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65865 samples/s/p 3:38:58 } +2024-07-30 02:28:16,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 84/ 3125], loss: 1.097, per_step_time: 1413ms, lr: 2.9537364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:16,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65886 samples/s/p 3:38:54 } +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 86/ 3125], loss: 1.357, per_step_time: 1413ms, lr: 3.024911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66091 samples/s/p 3:38:47 } +2024-07-30 02:28:22,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 88/ 3125], loss: 1.011, per_step_time: 1416ms, lr: 3.0960855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:22,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.64775 samples/s/p 3:39:14 } +2024-07-30 02:28:25,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 90/ 3125], loss: 0.990, per_step_time: 1413ms, lr: 3.1672596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:25,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.66058 samples/s/p 3:38:42 } +2024-07-30 02:28:27,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 92/ 3125], loss: 1.119, per_step_time: 1414ms, lr: 3.2384341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:27,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65503 samples/s/p 3:38:52 } +2024-07-30 02:28:30,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 94/ 3125], loss: 1.152, per_step_time: 1414ms, lr: 3.3096082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:30,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65755 samples/s/p 3:38:43 } +2024-07-30 02:28:33,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 96/ 3125], loss: 1.270, per_step_time: 1413ms, lr: 3.3807828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:33,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65906 samples/s/p 3:38:37 } +2024-07-30 02:28:36,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 98/ 3125], loss: 1.162, per_step_time: 1415ms, lr: 3.4519574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65354 samples/s/p 3:38:47 } +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 100/ 3125], loss: 0.916, per_step_time: 1413ms, lr: 3.5231315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66082 samples/s/p 3:38:27 } +2024-07-30 02:28:42,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 102/ 3125], loss: 1.030, per_step_time: 1414ms, lr: 3.594306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:42,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65606 samples/s/p 3:38:35 } +2024-07-30 02:28:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 104/ 3125], loss: 1.432, per_step_time: 1415ms, lr: 3.6654803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65238 samples/s/p 3:38:41 } +2024-07-30 02:28:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 106/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.7366547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65971 samples/s/p 3:38:21 } +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 108/ 3125], loss: 1.291, per_step_time: 1413ms, lr: 3.807829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65829 samples/s/p 3:38:22 } +2024-07-30 02:28:53,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 110/ 3125], loss: 1.239, per_step_time: 1413ms, lr: 3.8790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:53,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65994 samples/s/p 3:38:15 } +2024-07-30 02:28:56,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 112/ 3125], loss: 1.071, per_step_time: 1415ms, lr: 3.950178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65363 samples/s/p 3:38:27 } +2024-07-30 02:28:59,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 114/ 3125], loss: 1.148, per_step_time: 1414ms, lr: 4.021352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:59,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65687 samples/s/p 3:38:16 } +2024-07-30 02:29:02,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 116/ 3125], loss: 1.301, per_step_time: 1413ms, lr: 4.0925265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:02,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66132 samples/s/p 3:38:03 } +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 118/ 3125], loss: 0.982, per_step_time: 1413ms, lr: 4.163701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65798 samples/s/p 3:38:08 } +2024-07-30 02:29:07,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 120/ 3125], loss: 1.209, per_step_time: 1414ms, lr: 4.234875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65593 samples/s/p 3:38:10 } +2024-07-30 02:29:10,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 122/ 3125], loss: 0.910, per_step_time: 1414ms, lr: 4.3060495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:10,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65603 samples/s/p 3:38:07 } +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 124/ 3125], loss: 1.276, per_step_time: 1414ms, lr: 4.377224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65388 samples/s/p 3:38:09 } +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 126/ 3125], loss: 1.127, per_step_time: 1413ms, lr: 4.4483986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65859 samples/s/p 3:37:56 } +2024-07-30 02:29:19,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 128/ 3125], loss: 0.940, per_step_time: 1413ms, lr: 4.519573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:19,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65918 samples/s/p 3:37:51 } +2024-07-30 02:29:21,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 130/ 3125], loss: 1.026, per_step_time: 1413ms, lr: 4.5907473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:21,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65904 samples/s/p 3:37:49 } +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 132/ 3125], loss: 0.990, per_step_time: 1414ms, lr: 4.6619216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65642 samples/s/p 3:37:52 } +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 134/ 3125], loss: 1.413, per_step_time: 1413ms, lr: 4.733096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.66034 samples/s/p 3:37:40 } +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 136/ 3125], loss: 1.120, per_step_time: 1413ms, lr: 4.8042702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65789 samples/s/p 3:37:43 } +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 138/ 3125], loss: 0.952, per_step_time: 1415ms, lr: 4.8754446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65310 samples/s/p 3:37:51 } +2024-07-30 02:29:36,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 140/ 3125], loss: 1.111, per_step_time: 1414ms, lr: 4.9466194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:36,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65617 samples/s/p 3:37:41 } +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 142/ 3125], loss: 1.099, per_step_time: 1414ms, lr: 5.0177937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65590 samples/s/p 3:37:39 } +2024-07-30 02:29:41,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 144/ 3125], loss: 1.208, per_step_time: 1414ms, lr: 5.0889676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:41,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65716 samples/s/p 3:37:33 } +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 146/ 3125], loss: 1.044, per_step_time: 1413ms, lr: 5.160142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.65962 samples/s/p 3:37:25 } +2024-07-30 02:29:47,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 148/ 3125], loss: 1.002, per_step_time: 1413ms, lr: 5.2313167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66032 samples/s/p 3:37:20 } +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 150/ 3125], loss: 1.366, per_step_time: 1413ms, lr: 5.302491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66051 samples/s/p 3:37:17 } +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 152/ 3125], loss: 0.954, per_step_time: 1413ms, lr: 5.3736658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66040 samples/s/p 3:37:15 } +2024-07-30 02:29:55,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 154/ 3125], loss: 0.976, per_step_time: 1413ms, lr: 5.4448396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.65987 samples/s/p 3:37:13 } +2024-07-30 02:29:58,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 156/ 3125], loss: 1.448, per_step_time: 1415ms, lr: 5.516014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:58,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65172 samples/s/p 3:37:29 } +2024-07-30 02:30:01,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 158/ 3125], loss: 1.134, per_step_time: 1413ms, lr: 5.5871883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:01,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65902 samples/s/p 3:37:09 } +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 160/ 3125], loss: 1.046, per_step_time: 1413ms, lr: 5.658363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65828 samples/s/p 3:37:08 } +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 162/ 3125], loss: 1.002, per_step_time: 1414ms, lr: 5.7295374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65502 samples/s/p 3:37:13 } +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 164/ 3125], loss: 0.902, per_step_time: 1413ms, lr: 5.8007113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.66130 samples/s/p 3:36:56 } +2024-07-30 02:30:12,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 166/ 3125], loss: 1.278, per_step_time: 1413ms, lr: 5.871886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65941 samples/s/p 3:36:57 } +2024-07-30 02:30:15,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 168/ 3125], loss: 0.935, per_step_time: 1415ms, lr: 5.9430604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:15,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65141 samples/s/p 3:37:13 } +2024-07-30 02:30:18,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 170/ 3125], loss: 0.847, per_step_time: 1413ms, lr: 6.0142347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:18,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.66014 samples/s/p 3:36:50 } +2024-07-30 02:30:21,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 172/ 3125], loss: 0.977, per_step_time: 1413ms, lr: 6.0854086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:21,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65912 samples/s/p 3:36:49 } +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 174/ 3125], loss: 1.147, per_step_time: 1413ms, lr: 6.1565834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66088 samples/s/p 3:36:42 } +2024-07-30 02:30:27,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 176/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 6.2277577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:27,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66003 samples/s/p 3:36:42 } +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 178/ 3125], loss: 0.672, per_step_time: 1413ms, lr: 6.2989325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.65865 samples/s/p 3:36:42 } +2024-07-30 02:30:32,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 180/ 3125], loss: 0.873, per_step_time: 1413ms, lr: 6.370107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:32,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66026 samples/s/p 3:36:35 } +2024-07-30 02:30:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 182/ 3125], loss: 1.075, per_step_time: 1416ms, lr: 6.4412807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:35,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.64862 samples/s/p 3:36:59 } +2024-07-30 02:30:38,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 184/ 3125], loss: 0.945, per_step_time: 1414ms, lr: 6.512455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:38,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65749 samples/s/p 3:36:36 } +2024-07-30 02:30:41,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 186/ 3125], loss: 0.759, per_step_time: 1415ms, lr: 6.58363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:41,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65128 samples/s/p 3:36:48 } +2024-07-30 02:30:44,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 188/ 3125], loss: 0.980, per_step_time: 1414ms, lr: 6.654804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:44,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65633 samples/s/p 3:36:33 } +2024-07-30 02:30:46,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 190/ 3125], loss: 1.129, per_step_time: 1413ms, lr: 6.725979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:46,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.66161 samples/s/p 3:36:18 } +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 192/ 3125], loss: 0.925, per_step_time: 1413ms, lr: 6.7971528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65935 samples/s/p 3:36:21 } +2024-07-30 02:30:52,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 194/ 3125], loss: 0.785, per_step_time: 1413ms, lr: 6.868327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66034 samples/s/p 3:36:15 } +2024-07-30 02:30:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 196/ 3125], loss: 1.030, per_step_time: 1413ms, lr: 6.9395014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:55,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65925 samples/s/p 3:36:15 } +2024-07-30 02:30:58,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 198/ 3125], loss: 0.733, per_step_time: 1413ms, lr: 7.010676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:58,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65915 samples/s/p 3:36:12 } +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 200/ 3125], loss: 0.688, per_step_time: 1414ms, lr: 7.0818505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65414 samples/s/p 3:36:21 } +2024-07-30 02:31:03,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 202/ 3125], loss: 0.663, per_step_time: 1413ms, lr: 7.1530244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:03,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65807 samples/s/p 3:36:09 } +2024-07-30 02:31:06,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 204/ 3125], loss: 0.988, per_step_time: 1415ms, lr: 7.224199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:06,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65366 samples/s/p 3:36:17 } +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 206/ 3125], loss: 1.034, per_step_time: 1413ms, lr: 7.2953735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65819 samples/s/p 3:36:03 } +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 208/ 3125], loss: 0.978, per_step_time: 1414ms, lr: 7.366548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65459 samples/s/p 3:36:09 } +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 210/ 3125], loss: 0.827, per_step_time: 1413ms, lr: 7.4377217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.66074 samples/s/p 3:35:52 } +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 212/ 3125], loss: 0.735, per_step_time: 1414ms, lr: 7.5088965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65766 samples/s/p 3:35:56 } +2024-07-30 02:31:20,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 214/ 3125], loss: 0.890, per_step_time: 1414ms, lr: 7.580071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65577 samples/s/p 3:35:58 } +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 216/ 3125], loss: 0.707, per_step_time: 1413ms, lr: 7.651245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.66003 samples/s/p 3:35:45 } +2024-07-30 02:31:26,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 218/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 7.7224195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65816 samples/s/p 3:35:46 } +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 220/ 3125], loss: 0.692, per_step_time: 1413ms, lr: 7.793594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65847 samples/s/p 3:35:43 } +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 222/ 3125], loss: 0.531, per_step_time: 1413ms, lr: 7.864768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66029 samples/s/p 3:35:36 } +2024-07-30 02:31:35,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 224/ 3125], loss: 0.898, per_step_time: 1415ms, lr: 7.935942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:35,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65096 samples/s/p 3:35:54 } +2024-07-30 02:31:37,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 226/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 8.007118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66097 samples/s/p 3:35:29 } +2024-07-30 02:31:40,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 228/ 3125], loss: 0.643, per_step_time: 1413ms, lr: 8.078292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:40,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65889 samples/s/p 3:35:31 } +2024-07-30 02:31:43,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 230/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 8.149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:43,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66022 samples/s/p 3:35:25 } +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 232/ 3125], loss: 0.616, per_step_time: 1414ms, lr: 8.220641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:46,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65749 samples/s/p 3:35:28 } +2024-07-30 02:31:49,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 234/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 8.291815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66099 samples/s/p 3:35:17 } +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 236/ 3125], loss: 0.715, per_step_time: 1413ms, lr: 8.362989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66101 samples/s/p 3:35:15 } +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 238/ 3125], loss: 0.645, per_step_time: 1413ms, lr: 8.434164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65904 samples/s/p 3:35:16 } +2024-07-30 02:31:57,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 240/ 3125], loss: 0.602, per_step_time: 1413ms, lr: 8.505338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:57,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66002 samples/s/p 3:35:11 } +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 242/ 3125], loss: 0.831, per_step_time: 1413ms, lr: 8.576512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65964 samples/s/p 3:35:09 } +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 244/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.647687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65888 samples/s/p 3:35:08 } +2024-07-30 02:32:06,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 246/ 3125], loss: 0.654, per_step_time: 1413ms, lr: 8.718861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:06,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65803 samples/s/p 3:35:07 } +2024-07-30 02:32:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 248/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 8.790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:09,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66013 samples/s/p 3:35:00 } +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 250/ 3125], loss: 0.783, per_step_time: 1414ms, lr: 8.86121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65426 samples/s/p 3:35:10 } +2024-07-30 02:32:14,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 252/ 3125], loss: 0.595, per_step_time: 1414ms, lr: 8.932384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:14,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65646 samples/s/p 3:35:02 } +2024-07-30 02:32:17,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 254/ 3125], loss: 0.493, per_step_time: 1414ms, lr: 9.003558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65677 samples/s/p 3:34:59 } +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 256/ 3125], loss: 0.632, per_step_time: 1412ms, lr: 9.074733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.66215 samples/s/p 3:34:44 } +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 258/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 9.145907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65866 samples/s/p 3:34:49 } +2024-07-30 02:32:26,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 260/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.217081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:26,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65880 samples/s/p 3:34:46 } +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 262/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 9.288256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.66004 samples/s/p 3:34:40 } +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 264/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.359431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65866 samples/s/p 3:34:40 } +2024-07-30 02:32:34,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 266/ 3125], loss: 0.649, per_step_time: 1413ms, lr: 9.430605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:34,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65865 samples/s/p 3:34:37 } +2024-07-30 02:32:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 268/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.501779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:37,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65544 samples/s/p 3:34:42 } +2024-07-30 02:32:40,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 270/ 3125], loss: 0.578, per_step_time: 1413ms, lr: 9.572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66006 samples/s/p 3:34:29 } +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 272/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.644128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66027 samples/s/p 3:34:25 } +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 274/ 3125], loss: 0.552, per_step_time: 1413ms, lr: 9.715302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66149 samples/s/p 3:34:20 } +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 276/ 3125], loss: 0.565, per_step_time: 1413ms, lr: 9.786476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66073 samples/s/p 3:34:19 } +2024-07-30 02:32:51,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 278/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.857651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:51,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66097 samples/s/p 3:34:15 } +2024-07-30 02:32:54,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 280/ 3125], loss: 0.584, per_step_time: 1413ms, lr: 9.928825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:54,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66103 samples/s/p 3:34:12 } +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 282/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1e-05, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:57,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.65992 samples/s/p 3:34:12 } +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 284/ 3125], loss: 0.723, per_step_time: 1412ms, lr: 9.999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66241 samples/s/p 3:34:04 } +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 286/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 9.999995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65955 samples/s/p 3:34:07 } +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 288/ 3125], loss: 0.553, per_step_time: 1414ms, lr: 9.999989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65734 samples/s/p 3:34:09 } +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 290/ 3125], loss: 0.653, per_step_time: 1412ms, lr: 9.999981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66179 samples/s/p 3:33:56 } +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 292/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.99997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66064 samples/s/p 3:33:56 } +2024-07-30 02:33:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 294/ 3125], loss: 0.442, per_step_time: 1412ms, lr: 9.999957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:14,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66175 samples/s/p 3:33:51 } +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 296/ 3125], loss: 0.624, per_step_time: 1413ms, lr: 9.9999415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65831 samples/s/p 3:33:56 } +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 298/ 3125], loss: 0.522, per_step_time: 1413ms, lr: 9.999923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65874 samples/s/p 3:33:52 } +2024-07-30 02:33:22,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 300/ 3125], loss: 0.537, per_step_time: 1414ms, lr: 9.999903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:22,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65459 samples/s/p 3:33:59 } +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 302/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.999881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65830 samples/s/p 3:33:47 } +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 304/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 9.999855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65482 samples/s/p 3:33:52 } +2024-07-30 02:33:31,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 306/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.999828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66242 samples/s/p 3:33:32 } +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 308/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.999798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65832 samples/s/p 3:33:39 } +2024-07-30 02:33:36,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 310/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.999765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:36,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65997 samples/s/p 3:33:32 } +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 312/ 3125], loss: 0.609, per_step_time: 1413ms, lr: 9.9997305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65981 samples/s/p 3:33:30 } +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 314/ 3125], loss: 0.541, per_step_time: 1414ms, lr: 9.999694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65742 samples/s/p 3:33:32 } +2024-07-30 02:33:45,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 316/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 9.999654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65837 samples/s/p 3:33:27 } +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 318/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.999613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66042 samples/s/p 3:33:20 } +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 320/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.999569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65885 samples/s/p 3:33:21 } +2024-07-30 02:33:53,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 322/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.999521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:53,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66013 samples/s/p 3:33:15 } +2024-07-30 02:33:56,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 324/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.999473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:56,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.66048 samples/s/p 3:33:11 } +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 326/ 3125], loss: 0.508, per_step_time: 1415ms, lr: 9.999422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:59,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65321 samples/s/p 3:33:25 } +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 328/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 9.999369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65877 samples/s/p 3:33:10 } +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 330/ 3125], loss: 0.249, per_step_time: 1426ms, lr: 9.999312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.60915 samples/s/p 3:35:00 } +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 332/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.999253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65508 samples/s/p 3:33:12 } +2024-07-30 02:34:10,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 334/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.999193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:10,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66071 samples/s/p 3:32:57 } +2024-07-30 02:34:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 336/ 3125], loss: 0.487, per_step_time: 1413ms, lr: 9.99913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65878 samples/s/p 3:32:58 } +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 338/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.999064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66042 samples/s/p 3:32:52 } +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 340/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.998996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65988 samples/s/p 3:32:50 } +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 342/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 9.998925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66018 samples/s/p 3:32:47 } +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 344/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.998853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65902 samples/s/p 3:32:46 } +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 346/ 3125], loss: 0.434, per_step_time: 1412ms, lr: 9.998778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66329 samples/s/p 3:32:34 } +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 348/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 9.9987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65908 samples/s/p 3:32:41 } +2024-07-30 02:34:33,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 350/ 3125], loss: 0.393, per_step_time: 1416ms, lr: 9.99862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:33,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.64721 samples/s/p 3:33:05 } +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 352/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.998537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65554 samples/s/p 3:32:43 } +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 354/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.998453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66137 samples/s/p 3:32:27 } +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 356/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 9.998366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65819 samples/s/p 3:32:31 } +2024-07-30 02:34:45,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 358/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.998276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:45,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66040 samples/s/p 3:32:23 } +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 360/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 9.998184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65647 samples/s/p 3:32:30 } +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 362/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.99809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65892 samples/s/p 3:32:21 } +2024-07-30 02:34:53,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 364/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.997993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:53,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65971 samples/s/p 3:32:17 } +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 366/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66005 samples/s/p 3:32:13 } +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 368/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66158 samples/s/p 3:32:07 } +2024-07-30 02:35:02,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 370/ 3125], loss: 0.284, per_step_time: 1425ms, lr: 9.99769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.61076 samples/s/p 3:33:59 } +2024-07-30 02:35:04,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 372/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.997583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:04,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65961 samples/s/p 3:32:05 } +2024-07-30 02:35:07,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 374/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.997474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:07,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65546 samples/s/p 3:32:12 } +2024-07-30 02:35:10,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 376/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 9.997363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:10,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.66063 samples/s/p 3:31:58 } +2024-07-30 02:35:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 378/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.997249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.65956 samples/s/p 3:31:57 } +2024-07-30 02:35:16,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 380/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.997134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:16,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65731 samples/s/p 3:31:59 } +2024-07-30 02:35:19,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 382/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.997016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:19,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65755 samples/s/p 3:31:56 } +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 384/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.996896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65755 samples/s/p 3:31:53 } +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 386/ 3125], loss: 0.075, per_step_time: 1414ms, lr: 9.996773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65580 samples/s/p 3:31:54 } +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 388/ 3125], loss: 0.596, per_step_time: 1414ms, lr: 9.996647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65658 samples/s/p 3:31:50 } +2024-07-30 02:35:30,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 390/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.996519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:30,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66145 samples/s/p 3:31:36 } +2024-07-30 02:35:33,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 392/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.996389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:33,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66065 samples/s/p 3:31:35 } +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 394/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.996256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:36,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66109 samples/s/p 3:31:31 } +2024-07-30 02:35:38,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 396/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.996122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65923 samples/s/p 3:31:32 } +2024-07-30 02:35:41,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 398/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.995984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:41,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65819 samples/s/p 3:31:32 } +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 400/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.995845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65558 samples/s/p 3:31:35 } +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 402/ 3125], loss: 0.443, per_step_time: 1413ms, lr: 9.995703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65949 samples/s/p 3:31:23 } +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 404/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.995558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65965 samples/s/p 3:31:20 } +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 406/ 3125], loss: 0.283, per_step_time: 1414ms, lr: 9.995412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65738 samples/s/p 3:31:22 } +2024-07-30 02:35:55,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 408/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.995262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:55,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65576 samples/s/p 3:31:23 } +2024-07-30 02:35:58,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 410/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 9.995111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:58,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66103 samples/s/p 3:31:09 } +2024-07-30 02:36:01,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 412/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.994957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:01,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65852 samples/s/p 3:31:11 } +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 414/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.994801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66058 samples/s/p 3:31:04 } +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 416/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.994643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65707 samples/s/p 3:31:09 } +2024-07-30 02:36:10,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 418/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.994482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66030 samples/s/p 3:30:59 } +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 420/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.994317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:12,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66154 samples/s/p 3:30:53 } +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 422/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.994152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.65827 samples/s/p 3:30:58 } +2024-07-30 02:36:18,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 424/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.993983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:18,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66028 samples/s/p 3:30:50 } +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 426/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.9938125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66191 samples/s/p 3:30:44 } +2024-07-30 02:36:24,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 428/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.99364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:24,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66049 samples/s/p 3:30:44 } +2024-07-30 02:36:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 430/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.993465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:27,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65958 samples/s/p 3:30:44 } +2024-07-30 02:36:29,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 432/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 9.993287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:29,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65693 samples/s/p 3:30:47 } +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 434/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 9.993107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65965 samples/s/p 3:30:38 } +2024-07-30 02:36:35,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 436/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 9.992924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:35,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65618 samples/s/p 3:30:43 } +2024-07-30 02:36:38,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 438/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 9.992738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65904 samples/s/p 3:30:33 } +2024-07-30 02:36:41,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 440/ 3125], loss: 0.661, per_step_time: 1413ms, lr: 9.992552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:41,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65914 samples/s/p 3:30:30 } +2024-07-30 02:36:44,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 442/ 3125], loss: 0.255, per_step_time: 1416ms, lr: 9.992362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:44,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.64727 samples/s/p 3:30:54 } +2024-07-30 02:36:46,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 444/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.99217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:46,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65760 samples/s/p 3:30:28 } +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 446/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.991976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66032 samples/s/p 3:30:19 } +2024-07-30 02:36:52,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 448/ 3125], loss: 0.331, per_step_time: 1415ms, lr: 9.991779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:52,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65209 samples/s/p 3:30:35 } +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 450/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.99158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66257 samples/s/p 3:30:09 } +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 452/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.991378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65861 samples/s/p 3:30:15 } +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 454/ 3125], loss: 0.512, per_step_time: 1414ms, lr: 9.991173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65739 samples/s/p 3:30:15 } +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 456/ 3125], loss: 0.390, per_step_time: 1414ms, lr: 9.990968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:03,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65491 samples/s/p 3:30:17 } +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 458/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 9.990758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65872 samples/s/p 3:30:06 } +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 460/ 3125], loss: 0.634, per_step_time: 1413ms, lr: 9.990547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66162 samples/s/p 3:29:57 } +2024-07-30 02:37:12,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 462/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.990334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66198 samples/s/p 3:29:53 } +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 464/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 9.990118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65475 samples/s/p 3:30:06 } +2024-07-30 02:37:18,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 466/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 9.9899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:18,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.65978 samples/s/p 3:29:52 } +2024-07-30 02:37:20,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 468/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 9.98968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:20,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66150 samples/s/p 3:29:46 } +2024-07-30 02:37:23,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 470/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.989456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:23,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66137 samples/s/p 3:29:43 } +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 472/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.98923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66013 samples/s/p 3:29:43 } +2024-07-30 02:37:29,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 474/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.989003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:29,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65973 samples/s/p 3:29:41 } +2024-07-30 02:37:32,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 476/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 9.988773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:32,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65989 samples/s/p 3:29:38 } +2024-07-30 02:37:35,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 478/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.98854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:35,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65868 samples/s/p 3:29:38 } +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 480/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.9883055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65918 samples/s/p 3:29:34 } +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 482/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 9.988068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65577 samples/s/p 3:29:39 } +2024-07-30 02:37:43,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 484/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 9.987828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:43,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65950 samples/s/p 3:29:27 } +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 486/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.987586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65876 samples/s/p 3:29:26 } +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 488/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.987341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65853 samples/s/p 3:29:24 } +2024-07-30 02:37:52,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 490/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 9.987094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.66067 samples/s/p 3:29:16 } +2024-07-30 02:37:54,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 492/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 9.986845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65722 samples/s/p 3:29:21 } +2024-07-30 02:37:57,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 494/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.986594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:57,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65786 samples/s/p 3:29:17 } +2024-07-30 02:38:00,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 496/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 9.986339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:00,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65651 samples/s/p 3:29:17 } +2024-07-30 02:38:03,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 498/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 9.986084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65721 samples/s/p 3:29:13 } +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 500/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 9.985824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65657 samples/s/p 3:29:11 } +2024-07-30 02:38:09,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 502/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 9.985563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:09,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66047 samples/s/p 3:29:00 } +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 504/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 9.9853005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66212 samples/s/p 3:28:53 } +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 506/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 9.985034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65694 samples/s/p 3:29:02 } +2024-07-30 02:38:17,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 508/ 3125], loss: 0.528, per_step_time: 1413ms, lr: 9.984766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:17,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65997 samples/s/p 3:28:52 } +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 510/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.984494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65966 samples/s/p 3:28:50 } +2024-07-30 02:38:23,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 512/ 3125], loss: 0.172, per_step_time: 1415ms, lr: 9.984221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:23,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65237 samples/s/p 3:29:04 } +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 514/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.983946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66040 samples/s/p 3:28:43 } +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 516/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 9.983668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66092 samples/s/p 3:28:39 } +2024-07-30 02:38:31,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 518/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.983388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:31,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66052 samples/s/p 3:28:37 } +2024-07-30 02:38:34,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 520/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.983105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:34,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65940 samples/s/p 3:28:37 } +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 522/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 9.98282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66021 samples/s/p 3:28:32 } +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 524/ 3125], loss: 0.506, per_step_time: 1413ms, lr: 9.982533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.65956 samples/s/p 3:28:31 } +2024-07-30 02:38:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 526/ 3125], loss: 0.324, per_step_time: 1412ms, lr: 9.982244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66254 samples/s/p 3:28:21 } +2024-07-30 02:38:45,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 528/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.981952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:45,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66091 samples/s/p 3:28:22 } +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 530/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.981657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.65989 samples/s/p 3:28:22 } +2024-07-30 02:38:51,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 532/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.981361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:51,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66040 samples/s/p 3:28:18 } +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 534/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.981061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66130 samples/s/p 3:28:13 } +2024-07-30 02:38:57,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 536/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.980759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:57,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66003 samples/s/p 3:28:13 } +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 538/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66106 samples/s/p 3:28:08 } +2024-07-30 02:39:02,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 540/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:02,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66079 samples/s/p 3:28:05 } +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 542/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.97984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66026 samples/s/p 3:28:04 } +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 544/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 9.979529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65671 samples/s/p 3:28:09 } +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 546/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.979216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65441 samples/s/p 3:28:11 } +2024-07-30 02:39:14,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 548/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 9.9788995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65623 samples/s/p 3:28:04 } +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 550/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.978581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65916 samples/s/p 3:27:55 } +2024-07-30 02:39:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 552/ 3125], loss: 0.391, per_step_time: 1415ms, lr: 9.978261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65170 samples/s/p 3:28:08 } +2024-07-30 02:39:22,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 554/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.977938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65716 samples/s/p 3:27:54 } +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 556/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.9776125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.66002 samples/s/p 3:27:44 } +2024-07-30 02:39:28,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 558/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.977284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:28,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66060 samples/s/p 3:27:40 } +2024-07-30 02:39:31,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 560/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 9.976954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:31,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66173 samples/s/p 3:27:35 } +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 562/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66002 samples/s/p 3:27:36 } +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 564/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.976287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.66113 samples/s/p 3:27:31 } +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 566/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.97595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.65966 samples/s/p 3:27:31 } +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 568/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 9.97561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.66102 samples/s/p 3:27:25 } +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 570/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 9.975269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65498 samples/s/p 3:27:36 } +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 572/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 9.974923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65903 samples/s/p 3:27:24 } +2024-07-30 02:39:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 574/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.974578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:51,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65870 samples/s/p 3:27:22 } +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 576/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.974228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65546 samples/s/p 3:27:26 } +2024-07-30 02:39:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 578/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 9.973876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:56,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65699 samples/s/p 3:27:20 } +2024-07-30 02:39:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 580/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.9735225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:59,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65931 samples/s/p 3:27:12 } +2024-07-30 02:40:02,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 582/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 9.973166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:02,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65745 samples/s/p 3:27:13 } +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 584/ 3125], loss: 0.215, per_step_time: 1418ms, lr: 9.972808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.63935 samples/s/p 3:27:50 } +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 586/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.972447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66130 samples/s/p 3:26:59 } +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 588/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.972084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65781 samples/s/p 3:27:04 } +2024-07-30 02:40:13,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 590/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 9.971717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:13,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66183 samples/s/p 3:26:52 } +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 592/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 9.971349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65668 samples/s/p 3:27:01 } +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 594/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.970979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65951 samples/s/p 3:26:52 } +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 596/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 9.970605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65714 samples/s/p 3:26:54 } +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 598/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.970231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65925 samples/s/p 3:26:47 } +2024-07-30 02:40:27,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 600/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 9.969853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65278 samples/s/p 3:26:58 } +2024-07-30 02:40:30,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 602/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.969473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:30,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65931 samples/s/p 3:26:41 } +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 604/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 9.96909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65898 samples/s/p 3:26:39 } +2024-07-30 02:40:36,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 606/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.968706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:36,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65907 samples/s/p 3:26:36 } +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 608/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.968318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65985 samples/s/p 3:26:31 } +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 610/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.967929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66169 samples/s/p 3:26:24 } +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 612/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.967536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66108 samples/s/p 3:26:23 } +2024-07-30 02:40:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 614/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 9.967143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65803 samples/s/p 3:26:27 } +2024-07-30 02:40:50,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 616/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.966746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65959 samples/s/p 3:26:21 } +2024-07-30 02:40:53,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 618/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.966347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:53,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65156 samples/s/p 3:26:35 } +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 620/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.9659455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66147 samples/s/p 3:26:11 } +2024-07-30 02:40:59,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 622/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 9.965543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:59,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65634 samples/s/p 3:26:19 } +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 624/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 9.965136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65997 samples/s/p 3:26:08 } +2024-07-30 02:41:04,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 626/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 9.964728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66197 samples/s/p 3:26:01 } +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 628/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.964317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65871 samples/s/p 3:26:06 } +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 630/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.963903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66041 samples/s/p 3:25:59 } +2024-07-30 02:41:13,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 632/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.963488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:13,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65830 samples/s/p 3:26:01 } +2024-07-30 02:41:16,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 634/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 9.96307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:16,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65169 samples/s/p 3:26:12 } +2024-07-30 02:41:19,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 636/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 9.96265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:19,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65586 samples/s/p 3:26:00 } +2024-07-30 02:41:21,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 638/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.9622275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:21,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65930 samples/s/p 3:25:50 } +2024-07-30 02:41:24,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 640/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.961802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66271 samples/s/p 3:25:40 } +2024-07-30 02:41:27,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 642/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.961374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65914 samples/s/p 3:25:45 } +2024-07-30 02:41:30,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 644/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.960944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65742 samples/s/p 3:25:46 } +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 646/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 9.960513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65441 samples/s/p 3:25:50 } +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 648/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 9.9600775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65926 samples/s/p 3:25:36 } +2024-07-30 02:41:38,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 650/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.959642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:38,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65887 samples/s/p 3:25:34 } +2024-07-30 02:41:41,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 652/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.9592025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:41,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65414 samples/s/p 3:25:42 } +2024-07-30 02:41:44,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 654/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 9.9587605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:44,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65516 samples/s/p 3:25:37 } +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 656/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 9.958317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65659 samples/s/p 3:25:31 } +2024-07-30 02:41:50,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 658/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.95787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:50,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65976 samples/s/p 3:25:21 } +2024-07-30 02:41:53,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 660/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 9.957421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:53,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.66132 samples/s/p 3:25:15 } +2024-07-30 02:41:55,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 662/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.95697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66029 samples/s/p 3:25:14 } +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 664/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.956517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65887 samples/s/p 3:25:14 } +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 666/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.95606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66104 samples/s/p 3:25:07 } +2024-07-30 02:42:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 668/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.955603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:04,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65919 samples/s/p 3:25:08 } +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 670/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 9.955142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66053 samples/s/p 3:25:02 } +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 672/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.95468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66130 samples/s/p 3:24:58 } +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 674/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 9.954214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66090 samples/s/p 3:24:56 } +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 676/ 3125], loss: 0.388, per_step_time: 1415ms, lr: 9.953746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65338 samples/s/p 3:25:09 } +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 678/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.953275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65964 samples/s/p 3:24:53 } +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 680/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.952803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.66069 samples/s/p 3:24:48 } +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 682/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.9523295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65789 samples/s/p 3:24:51 } +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 684/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.951851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65667 samples/s/p 3:24:51 } +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 686/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.951372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.66072 samples/s/p 3:24:39 } +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 688/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 9.950891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.64869 samples/s/p 3:25:03 } +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 690/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.950406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65621 samples/s/p 3:24:43 } +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 692/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 9.94992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65920 samples/s/p 3:24:34 } +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 694/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.949431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66098 samples/s/p 3:24:27 } +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 696/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.948939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66058 samples/s/p 3:24:25 } +2024-07-30 02:42:46,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 698/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.948445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:46,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66072 samples/s/p 3:24:22 } +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 700/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.947949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65820 samples/s/p 3:24:25 } +2024-07-30 02:42:52,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 702/ 3125], loss: 0.373, per_step_time: 1416ms, lr: 9.947451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:52,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.64854 samples/s/p 3:24:43 } +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 704/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.946951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65455 samples/s/p 3:24:27 } +2024-07-30 02:42:58,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 706/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.946447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:58,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.66153 samples/s/p 3:24:09 } +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 708/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.945942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.65889 samples/s/p 3:24:12 } +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 710/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 9.945434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:03,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66186 samples/s/p 3:24:03 } +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 712/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.9449235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66001 samples/s/p 3:24:04 } +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 714/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 9.944411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66270 samples/s/p 3:23:55 } +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 716/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.943897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66134 samples/s/p 3:23:55 } +2024-07-30 02:43:15,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 718/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 9.943379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66227 samples/s/p 3:23:51 } +2024-07-30 02:43:18,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 720/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.942859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66155 samples/s/p 3:23:49 } +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 722/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 9.942337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65600 samples/s/p 3:23:59 } +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 724/ 3125], loss: 0.183, per_step_time: 1415ms, lr: 9.941812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65351 samples/s/p 3:24:01 } +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 726/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.941286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65680 samples/s/p 3:23:51 } +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 728/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.940757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65868 samples/s/p 3:23:44 } +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 730/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.940226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65808 samples/s/p 3:23:43 } +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 732/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 9.939692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65692 samples/s/p 3:23:42 } +2024-07-30 02:43:37,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 734/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.9391555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65995 samples/s/p 3:23:33 } +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 736/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 9.938616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66022 samples/s/p 3:23:30 } +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 738/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.938076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66063 samples/s/p 3:23:26 } +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 740/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 9.937533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:46,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66062 samples/s/p 3:23:23 } +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 742/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 9.936987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65663 samples/s/p 3:23:29 } +2024-07-30 02:43:52,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 744/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.93644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:52,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65781 samples/s/p 3:23:24 } +2024-07-30 02:43:54,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 746/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.935889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:54,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65818 samples/s/p 3:23:20 } +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 748/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.9353365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65787 samples/s/p 3:23:18 } +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.934782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65534 samples/s/p 3:23:20 } +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 752/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 9.934223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65478 samples/s/p 3:23:19 } +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 754/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 9.933664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65855 samples/s/p 3:23:08 } +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 756/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.933102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66029 samples/s/p 3:23:01 } +2024-07-30 02:44:11,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 758/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 9.932538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:11,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66030 samples/s/p 3:22:58 } +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 760/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.931971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66052 samples/s/p 3:22:55 } +2024-07-30 02:44:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 762/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 9.931402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.65983 samples/s/p 3:22:54 } +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 764/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.93083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.65873 samples/s/p 3:22:53 } +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.930256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.66112 samples/s/p 3:22:45 } +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 768/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.92968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.65894 samples/s/p 3:22:47 } +2024-07-30 02:44:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 770/ 3125], loss: 0.407, per_step_time: 1417ms, lr: 9.929101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:28,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.64301 samples/s/p 3:23:19 } +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 772/ 3125], loss: 0.230, per_step_time: 1421ms, lr: 9.928521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.62818 samples/s/p 3:23:48 } +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 774/ 3125], loss: 0.346, per_step_time: 1417ms, lr: 9.927937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64510 samples/s/p 3:23:08 } +2024-07-30 02:44:37,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 776/ 3125], loss: 0.453, per_step_time: 1416ms, lr: 9.927351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:37,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64822 samples/s/p 3:22:59 } +2024-07-30 02:44:40,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 778/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 9.926764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:40,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64908 samples/s/p 3:22:54 } +2024-07-30 02:44:43,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 780/ 3125], loss: 0.240, per_step_time: 1415ms, lr: 9.926173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:43,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64991 samples/s/p 3:22:50 } +2024-07-30 02:44:45,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 782/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 9.92558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:45,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.65901 samples/s/p 3:22:27 } +2024-07-30 02:44:48,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 784/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.9249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:48,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65973 samples/s/p 3:22:23 } +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 786/ 3125], loss: 0.095, per_step_time: 1414ms, lr: 9.924388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65425 samples/s/p 3:22:32 } +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 788/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.923788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65910 samples/s/p 3:22:19 } +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 790/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.923186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65951 samples/s/p 3:22:15 } +2024-07-30 02:45:00,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 792/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.922582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:00,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65864 samples/s/p 3:22:14 } +2024-07-30 02:45:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 794/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.921975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65947 samples/s/p 3:22:09 } +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 796/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.921366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:05,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.66024 samples/s/p 3:22:05 } +2024-07-30 02:45:08,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 798/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.920755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:08,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65850 samples/s/p 3:22:06 } +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 800/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 9.920141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:11,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65806 samples/s/p 3:22:04 } +2024-07-30 02:45:14,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 802/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.919525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:14,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65916 samples/s/p 3:21:59 } +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 804/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 9.918906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65648 samples/s/p 3:22:02 } +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 806/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.918285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:19,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65900 samples/s/p 3:21:53 } +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 808/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.917661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:22,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65419 samples/s/p 3:22:01 } +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 810/ 3125], loss: 0.288, per_step_time: 1421ms, lr: 9.917036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.62711 samples/s/p 3:22:56 } +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 812/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.916408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.65850 samples/s/p 3:21:46 } +2024-07-30 02:45:31,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 814/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.915778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:31,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66003 samples/s/p 3:21:40 } +2024-07-30 02:45:34,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 816/ 3125], loss: 0.241, per_step_time: 1417ms, lr: 9.915146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:34,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.64537 samples/s/p 3:22:08 } +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 818/ 3125], loss: 0.152, per_step_time: 1425ms, lr: 9.91451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.61247 samples/s/p 3:23:17 } +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 820/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 9.913872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.65967 samples/s/p 3:21:32 } +2024-07-30 02:45:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 822/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 9.913233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.64081 samples/s/p 3:22:10 } +2024-07-30 02:45:45,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 824/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.912591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:45,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66129 samples/s/p 3:21:23 } +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 826/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.911947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66045 samples/s/p 3:21:22 } +2024-07-30 02:45:51,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 828/ 3125], loss: 0.211, per_step_time: 1426ms, lr: 9.9112995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:51,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.60824 samples/s/p 3:23:12 } +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 830/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 9.910651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66273 samples/s/p 3:21:11 } +2024-07-30 02:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 832/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.909999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65940 samples/s/p 3:21:16 } +2024-07-30 02:45:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 834/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 9.909346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65921 samples/s/p 3:21:13 } +2024-07-30 02:46:02,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 836/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.908689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65977 samples/s/p 3:21:09 } +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 838/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.908032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66005 samples/s/p 3:21:06 } +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 840/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.90737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66109 samples/s/p 3:21:01 } +2024-07-30 02:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 842/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.906707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65825 samples/s/p 3:21:04 } +2024-07-30 02:46:13,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 844/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 9.906042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:13,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65629 samples/s/p 3:21:05 } +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 846/ 3125], loss: 0.305, per_step_time: 1416ms, lr: 9.905374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.64727 samples/s/p 3:21:22 } +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 848/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 9.904704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:19,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65666 samples/s/p 3:20:59 } +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 850/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.904032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.66007 samples/s/p 3:20:49 } +2024-07-30 02:46:25,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 852/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 9.903357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:25,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65448 samples/s/p 3:20:58 } +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 854/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.902679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.66047 samples/s/p 3:20:42 } +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 856/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 9.902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65706 samples/s/p 3:20:47 } +2024-07-30 02:46:33,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 858/ 3125], loss: 0.175, per_step_time: 1416ms, lr: 9.901319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:33,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.64808 samples/s/p 3:21:03 } +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 860/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 9.900634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:36,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65380 samples/s/p 3:20:48 } +2024-07-30 02:46:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 862/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 9.899947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66141 samples/s/p 3:20:29 } +2024-07-30 02:46:42,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 864/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.899259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:42,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65779 samples/s/p 3:20:34 } +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 866/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.8985665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66089 samples/s/p 3:20:24 } +2024-07-30 02:46:47,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 868/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.8978735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65895 samples/s/p 3:20:26 } +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 870/ 3125], loss: 0.532, per_step_time: 1413ms, lr: 9.897178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66063 samples/s/p 3:20:19 } +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 872/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.896479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65718 samples/s/p 3:20:24 } +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 874/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 9.895779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66044 samples/s/p 3:20:14 } +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 876/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.895076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66093 samples/s/p 3:20:10 } +2024-07-30 02:47:02,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 878/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.894371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:02,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.66057 samples/s/p 3:20:08 } +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 880/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 9.893663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65505 samples/s/p 3:20:17 } +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 882/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 9.892953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65956 samples/s/p 3:20:05 } +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 884/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.892241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65851 samples/s/p 3:20:04 } +2024-07-30 02:47:13,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 886/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.891526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:13,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66109 samples/s/p 3:19:56 } +2024-07-30 02:47:16,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 888/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 9.890809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:16,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65299 samples/s/p 3:20:10 } +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 890/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 9.89009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66239 samples/s/p 3:19:47 } +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 892/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.889369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65841 samples/s/p 3:19:53 } +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 894/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.888645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65700 samples/s/p 3:19:53 } +2024-07-30 02:47:27,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 896/ 3125], loss: 0.519, per_step_time: 1414ms, lr: 9.887918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:27,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65601 samples/s/p 3:19:52 } +2024-07-30 02:47:30,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 898/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.88719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:30,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65827 samples/s/p 3:19:45 } +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 900/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 9.886458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.66256 samples/s/p 3:19:33 } +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 902/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 9.885725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65941 samples/s/p 3:19:37 } +2024-07-30 02:47:38,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 904/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.8849905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:38,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65770 samples/s/p 3:19:38 } +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 906/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 9.884252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65772 samples/s/p 3:19:35 } +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 908/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.883512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65840 samples/s/p 3:19:30 } +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 910/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.8827695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65904 samples/s/p 3:19:26 } +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 912/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 9.882025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.66000 samples/s/p 3:19:21 } +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 914/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.881277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65945 samples/s/p 3:19:20 } +2024-07-30 02:47:55,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 916/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.8805285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:55,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.66008 samples/s/p 3:19:16 } +2024-07-30 02:47:58,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 918/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.879776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:58,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.66022 samples/s/p 3:19:12 } +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 920/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.8790215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65842 samples/s/p 3:19:13 } +2024-07-30 02:48:04,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 922/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.878265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:04,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65637 samples/s/p 3:19:15 } +2024-07-30 02:48:07,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 924/ 3125], loss: 0.222, per_step_time: 1415ms, lr: 9.877506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:07,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65350 samples/s/p 3:19:18 } +2024-07-30 02:48:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 926/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.876745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65882 samples/s/p 3:19:04 } +2024-07-30 02:48:12,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 928/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 9.875981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:12,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65889 samples/s/p 3:19:01 } +2024-07-30 02:48:15,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 930/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.875215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:15,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65819 samples/s/p 3:19:00 } +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 932/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 9.874447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.66006 samples/s/p 3:18:53 } +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 934/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.873676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.65533 samples/s/p 3:19:00 } +2024-07-30 02:48:24,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 936/ 3125], loss: 0.248, per_step_time: 1424ms, lr: 9.872903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.61437 samples/s/p 3:20:24 } +2024-07-30 02:48:27,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 938/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.872128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:27,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65802 samples/s/p 3:18:49 } +2024-07-30 02:48:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 940/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.871351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:30,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65928 samples/s/p 3:18:43 } +2024-07-30 02:48:32,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 942/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 9.8705705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.66161 samples/s/p 3:18:36 } +2024-07-30 02:48:35,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 944/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 9.869788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.65885 samples/s/p 3:18:39 } +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 946/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.869004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66192 samples/s/p 3:18:29 } +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 948/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 9.868218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.65987 samples/s/p 3:18:31 } +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 950/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.867428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66110 samples/s/p 3:18:25 } +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 952/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 9.866637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:47,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66001 samples/s/p 3:18:25 } +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 954/ 3125], loss: 0.370, per_step_time: 1412ms, lr: 9.865843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66175 samples/s/p 3:18:18 } +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 956/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.865046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:52,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.65897 samples/s/p 3:18:21 } +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 958/ 3125], loss: 0.088, per_step_time: 1416ms, lr: 9.864249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64598 samples/s/p 3:18:46 } +2024-07-30 02:48:58,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 960/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.863448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:58,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64845 samples/s/p 3:18:38 } +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 962/ 3125], loss: 0.118, per_step_time: 1421ms, lr: 9.862644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.62640 samples/s/p 3:19:22 } +2024-07-30 02:49:04,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 964/ 3125], loss: 0.348, per_step_time: 1414ms, lr: 9.861839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:04,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65768 samples/s/p 3:18:13 } +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 966/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.861032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65853 samples/s/p 3:18:08 } +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 968/ 3125], loss: 0.405, per_step_time: 1415ms, lr: 9.860221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65033 samples/s/p 3:18:23 } +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 970/ 3125], loss: 0.535, per_step_time: 1413ms, lr: 9.859409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65890 samples/s/p 3:18:02 } +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 972/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 9.858593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65913 samples/s/p 3:17:58 } +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 974/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 9.8577775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65953 samples/s/p 3:17:55 } +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 976/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.856958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66049 samples/s/p 3:17:50 } +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 978/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.856137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66055 samples/s/p 3:17:47 } +2024-07-30 02:49:26,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 980/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.855313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:26,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66056 samples/s/p 3:17:44 } +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 982/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.854486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65865 samples/s/p 3:17:45 } +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 984/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.8536575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65850 samples/s/p 3:17:43 } +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 986/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.852827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66052 samples/s/p 3:17:36 } +2024-07-30 02:49:38,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 988/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.851993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66021 samples/s/p 3:17:33 } +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 990/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 9.851158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65679 samples/s/p 3:17:38 } +2024-07-30 02:49:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 992/ 3125], loss: 0.267, per_step_time: 1416ms, lr: 9.85032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.64629 samples/s/p 3:17:57 } +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 994/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.849479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65870 samples/s/p 3:17:28 } +2024-07-30 02:49:49,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 996/ 3125], loss: 0.733, per_step_time: 1414ms, lr: 9.848637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:49,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65622 samples/s/p 3:17:31 } +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 998/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.847792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65579 samples/s/p 3:17:29 } +2024-07-30 02:49:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1000/ 3125], loss: 0.555, per_step_time: 1414ms, lr: 9.846945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65697 samples/s/p 3:17:23 } +2024-07-30 02:49:57,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1002/ 3125], loss: 0.196, per_step_time: 1415ms, lr: 9.846096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65248 samples/s/p 3:17:30 } +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1004/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.845244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:00,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65783 samples/s/p 3:17:16 } +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1006/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.84439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65752 samples/s/p 3:17:14 } +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1008/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 9.843533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65407 samples/s/p 3:17:18 } +2024-07-30 02:50:09,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1010/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.842675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:09,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65837 samples/s/p 3:17:06 } +2024-07-30 02:50:12,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1012/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.841814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:12,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65927 samples/s/p 3:17:02 } +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1014/ 3125], loss: 0.384, per_step_time: 1412ms, lr: 9.840951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66219 samples/s/p 3:16:53 } +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1016/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.840085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65907 samples/s/p 3:16:56 } +2024-07-30 02:50:20,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1018/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 9.839217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:20,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65712 samples/s/p 3:16:58 } +2024-07-30 02:50:23,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1020/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.838346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:23,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65980 samples/s/p 3:16:49 } +2024-07-30 02:50:26,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1022/ 3125], loss: 0.533, per_step_time: 1417ms, lr: 9.837474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64536 samples/s/p 3:17:16 } +2024-07-30 02:50:29,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1024/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.836599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:29,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65940 samples/s/p 3:16:44 } +2024-07-30 02:50:31,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1026/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.835722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:31,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.66149 samples/s/p 3:16:37 } +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1028/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 9.834843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.65942 samples/s/p 3:16:39 } +2024-07-30 02:50:37,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1030/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.833961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:37,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66089 samples/s/p 3:16:33 } +2024-07-30 02:50:40,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1032/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.833077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:40,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.65925 samples/s/p 3:16:33 } +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1034/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.83219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66183 samples/s/p 3:16:25 } +2024-07-30 02:50:46,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1036/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.831302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:46,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66047 samples/s/p 3:16:25 } +2024-07-30 02:50:48,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1038/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.83041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:48,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66069 samples/s/p 3:16:22 } +2024-07-30 02:50:51,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1040/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 9.829518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:51,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66058 samples/s/p 3:16:19 } +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1042/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.828622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66019 samples/s/p 3:16:17 } +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1044/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.827724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.65928 samples/s/p 3:16:16 } +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1046/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 9.826823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65724 samples/s/p 3:16:18 } +2024-07-30 02:51:03,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1048/ 3125], loss: 0.387, per_step_time: 1414ms, lr: 9.825921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65762 samples/s/p 3:16:14 } +2024-07-30 02:51:05,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1050/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 9.825016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:05,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65588 samples/s/p 3:16:15 } +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1052/ 3125], loss: 0.115, per_step_time: 1413ms, lr: 9.824109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65949 samples/s/p 3:16:05 } +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1054/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 9.8231985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65688 samples/s/p 3:16:07 } +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1056/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.822287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:14,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65916 samples/s/p 3:16:00 } +2024-07-30 02:51:17,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1058/ 3125], loss: 0.219, per_step_time: 1416ms, lr: 9.821373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:17,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.64678 samples/s/p 3:16:23 } +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1060/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.820457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65974 samples/s/p 3:15:53 } +2024-07-30 02:51:22,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1062/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 9.819539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65248 samples/s/p 3:16:05 } +2024-07-30 02:51:25,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1064/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.8186165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66107 samples/s/p 3:15:44 } +2024-07-30 02:51:28,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1066/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.817693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:28,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65953 samples/s/p 3:15:45 } +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1068/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 9.8167675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66173 samples/s/p 3:15:37 } +2024-07-30 02:51:34,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1070/ 3125], loss: 0.564, per_step_time: 1413ms, lr: 9.815841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:34,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65864 samples/s/p 3:15:41 } +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1072/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 9.81491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66120 samples/s/p 3:15:33 } +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1074/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.813978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65606 samples/s/p 3:15:41 } +2024-07-30 02:51:42,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1076/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 9.813043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:42,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65959 samples/s/p 3:15:30 } +2024-07-30 02:51:45,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1078/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.812105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:45,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66148 samples/s/p 3:15:24 } +2024-07-30 02:51:48,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1080/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.811166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:48,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66117 samples/s/p 3:15:21 } +2024-07-30 02:51:51,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1082/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.810225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:51,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65890 samples/s/p 3:15:23 } +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1084/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.8092805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65981 samples/s/p 3:15:19 } +2024-07-30 02:51:56,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1086/ 3125], loss: 0.335, per_step_time: 1412ms, lr: 9.808335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:56,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66189 samples/s/p 3:15:11 } +2024-07-30 02:51:59,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1088/ 3125], loss: 0.302, per_step_time: 1416ms, lr: 9.807386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:59,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.64869 samples/s/p 3:15:36 } +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1090/ 3125], loss: 0.307, per_step_time: 1415ms, lr: 9.806435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65087 samples/s/p 3:15:29 } +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1092/ 3125], loss: 0.224, per_step_time: 1415ms, lr: 9.8054825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65064 samples/s/p 3:15:26 } +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1094/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 9.804527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65344 samples/s/p 3:15:18 } +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1096/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.803569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65820 samples/s/p 3:15:05 } +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1098/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 9.8026085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65652 samples/s/p 3:15:06 } +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1100/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.801647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65663 samples/s/p 3:15:03 } +2024-07-30 02:52:19,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1102/ 3125], loss: 0.628, per_step_time: 1413ms, lr: 9.800682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:19,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65849 samples/s/p 3:14:56 } +2024-07-30 02:52:22,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1104/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.799715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:22,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66088 samples/s/p 3:14:48 } +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1106/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 9.798746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66081 samples/s/p 3:14:45 } +2024-07-30 02:52:28,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1108/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.7977745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65959 samples/s/p 3:14:45 } +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1110/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.7968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66056 samples/s/p 3:14:40 } +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1112/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.795824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65973 samples/s/p 3:14:39 } +2024-07-30 02:52:36,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1114/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.794847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:36,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66050 samples/s/p 3:14:35 } +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1116/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.7938655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65908 samples/s/p 3:14:35 } +2024-07-30 02:52:42,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1118/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 9.792882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:42,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66081 samples/s/p 3:14:29 } +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1120/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 9.791896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66196 samples/s/p 3:14:23 } +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1122/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 9.790909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.65713 samples/s/p 3:14:30 } +2024-07-30 02:52:50,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1124/ 3125], loss: 0.094, per_step_time: 1416ms, lr: 9.789919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:50,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.64782 samples/s/p 3:14:47 } +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1126/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.788928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.65848 samples/s/p 3:14:22 } +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1128/ 3125], loss: 0.300, per_step_time: 1417ms, lr: 9.787934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.64564 samples/s/p 3:14:46 } +2024-07-30 02:52:59,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1130/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.786936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:59,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66019 samples/s/p 3:14:13 } +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1132/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.785938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65822 samples/s/p 3:14:14 } +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1134/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.784937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65972 samples/s/p 3:14:08 } +2024-07-30 02:53:07,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1136/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 9.783933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:07,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66173 samples/s/p 3:14:01 } +2024-07-30 02:53:10,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1138/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 9.782927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:10,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65534 samples/s/p 3:14:11 } +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1140/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.781919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65955 samples/s/p 3:14:00 } +2024-07-30 02:53:16,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1142/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.780909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:16,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65707 samples/s/p 3:14:02 } +2024-07-30 02:53:19,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1144/ 3125], loss: 0.359, per_step_time: 1415ms, lr: 9.779896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:19,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65262 samples/s/p 3:14:09 } +2024-07-30 02:53:22,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1146/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.778881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:22,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65881 samples/s/p 3:13:53 } +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1148/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.777864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65912 samples/s/p 3:13:50 } +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1150/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 9.776844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65664 samples/s/p 3:13:52 } +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1152/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.775823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65951 samples/s/p 3:13:43 } +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1154/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.774798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65682 samples/s/p 3:13:46 } +2024-07-30 02:53:36,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1156/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 9.773771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:36,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65770 samples/s/p 3:13:41 } +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1158/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.772743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66083 samples/s/p 3:13:32 } +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1160/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 9.771713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:41,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66104 samples/s/p 3:13:29 } +2024-07-30 02:53:44,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1162/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.770679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:44,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65958 samples/s/p 3:13:29 } +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1164/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 9.769644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65788 samples/s/p 3:13:30 } +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1166/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.768606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66152 samples/s/p 3:13:19 } +2024-07-30 02:53:53,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1168/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.767566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:53,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65976 samples/s/p 3:13:20 } +2024-07-30 02:53:56,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1170/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 9.766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:56,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66174 samples/s/p 3:13:13 } +2024-07-30 02:53:58,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1172/ 3125], loss: 0.307, per_step_time: 1415ms, lr: 9.765479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:58,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65083 samples/s/p 3:13:33 } +2024-07-30 02:54:01,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1174/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 9.764432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:01,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65738 samples/s/p 3:13:16 } +2024-07-30 02:54:04,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1176/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 9.763384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:04,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65942 samples/s/p 3:13:09 } +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1178/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.762332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:07,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65399 samples/s/p 3:13:18 } +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1180/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 9.761278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65687 samples/s/p 3:13:09 } +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1182/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 9.760222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65705 samples/s/p 3:13:06 } +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1184/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 9.759164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65628 samples/s/p 3:13:05 } +2024-07-30 02:54:18,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1186/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 9.758104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65886 samples/s/p 3:12:56 } +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1188/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.75704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66008 samples/s/p 3:12:51 } +2024-07-30 02:54:24,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1190/ 3125], loss: 0.580, per_step_time: 1413ms, lr: 9.755976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:24,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66111 samples/s/p 3:12:46 } +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1192/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.754908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65916 samples/s/p 3:12:47 } +2024-07-30 02:54:30,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1194/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.75384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:30,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66055 samples/s/p 3:12:42 } +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1196/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.752767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66043 samples/s/p 3:12:39 } +2024-07-30 02:54:35,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1198/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.751693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:35,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65852 samples/s/p 3:12:40 } +2024-07-30 02:54:38,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1200/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 9.750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:38,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65741 samples/s/p 3:12:40 } +2024-07-30 02:54:41,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1202/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 9.749538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:41,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65925 samples/s/p 3:12:33 } +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1204/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.748457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66057 samples/s/p 3:12:27 } +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1206/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.747374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65941 samples/s/p 3:12:27 } +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1208/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.746288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65954 samples/s/p 3:12:24 } +2024-07-30 02:54:52,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1210/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.7452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66051 samples/s/p 3:12:19 } +2024-07-30 02:54:55,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1212/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 9.744111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:55,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65761 samples/s/p 3:12:22 } +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1214/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.7430175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66033 samples/s/p 3:12:14 } +2024-07-30 02:55:01,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1216/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.741923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:01,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.66073 samples/s/p 3:12:10 } +2024-07-30 02:55:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1218/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.7408265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.65942 samples/s/p 3:12:10 } +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1220/ 3125], loss: 0.406, per_step_time: 1417ms, lr: 9.739729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64207 samples/s/p 3:12:43 } +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1222/ 3125], loss: 0.280, per_step_time: 1416ms, lr: 9.738626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64781 samples/s/p 3:12:28 } +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1224/ 3125], loss: 0.308, per_step_time: 1427ms, lr: 9.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.60551 samples/s/p 3:13:52 } +2024-07-30 02:55:15,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1226/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.736417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:15,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66074 samples/s/p 3:11:56 } +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1228/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 9.7353095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66031 samples/s/p 3:11:54 } +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1230/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.734199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66027 samples/s/p 3:11:51 } +2024-07-30 02:55:23,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1232/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.733087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:23,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65809 samples/s/p 3:11:53 } +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1234/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 9.731971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65692 samples/s/p 3:11:52 } +2024-07-30 02:55:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1236/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.730855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:29,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65926 samples/s/p 3:11:45 } +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1238/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.729735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66057 samples/s/p 3:11:39 } +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1240/ 3125], loss: 0.144, per_step_time: 1412ms, lr: 9.728614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66203 samples/s/p 3:11:34 } +2024-07-30 02:55:38,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1242/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 9.727489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:38,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65981 samples/s/p 3:11:35 } +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1244/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 9.726363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66082 samples/s/p 3:11:30 } +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1246/ 3125], loss: 0.466, per_step_time: 1414ms, lr: 9.725235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65685 samples/s/p 3:11:36 } +2024-07-30 02:55:46,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1248/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.7241045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:46,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65748 samples/s/p 3:11:32 } +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1250/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.722971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:49,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65711 samples/s/p 3:11:29 } +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1252/ 3125], loss: 0.246, per_step_time: 1415ms, lr: 9.721835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:52,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65223 samples/s/p 3:11:37 } +2024-07-30 02:55:55,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1254/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.7206985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:55,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65724 samples/s/p 3:11:24 } +2024-07-30 02:55:57,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1256/ 3125], loss: 0.186, per_step_time: 1412ms, lr: 9.719559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:57,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66226 samples/s/p 3:11:11 } +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1258/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.718417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66007 samples/s/p 3:11:12 } +2024-07-30 02:56:03,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1260/ 3125], loss: 0.267, per_step_time: 1412ms, lr: 9.717272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:03,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66180 samples/s/p 3:11:06 } +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1262/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.716126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66095 samples/s/p 3:11:05 } +2024-07-30 02:56:09,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1264/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.714978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:09,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66056 samples/s/p 3:11:03 } +2024-07-30 02:56:12,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1266/ 3125], loss: 0.501, per_step_time: 1413ms, lr: 9.713827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:12,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65929 samples/s/p 3:11:02 } +2024-07-30 02:56:14,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1268/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 9.712674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:14,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65864 samples/s/p 3:11:01 } +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1270/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.711518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65937 samples/s/p 3:10:57 } +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1272/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.71036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65902 samples/s/p 3:10:54 } +2024-07-30 02:56:23,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1274/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.709201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:23,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65812 samples/s/p 3:10:53 } +2024-07-30 02:56:26,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1276/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.708038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:26,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65953 samples/s/p 3:10:48 } +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1278/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.706873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65728 samples/s/p 3:10:50 } +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1280/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 9.705706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65727 samples/s/p 3:10:47 } +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1282/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 9.704539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65253 samples/s/p 3:10:53 } +2024-07-30 02:56:37,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1284/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.703367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:37,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65616 samples/s/p 3:10:43 } +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1286/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 9.702194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66025 samples/s/p 3:10:32 } +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1288/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.701018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66128 samples/s/p 3:10:27 } +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1290/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 9.69984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66153 samples/s/p 3:10:24 } +2024-07-30 02:56:48,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1292/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.6986605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:48,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65971 samples/s/p 3:10:25 } +2024-07-30 02:56:51,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1294/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.697477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:51,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65961 samples/s/p 3:10:22 } +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1296/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.696292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66085 samples/s/p 3:10:17 } +2024-07-30 02:56:57,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1298/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.695105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:57,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65468 samples/s/p 3:10:26 } +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1300/ 3125], loss: 0.553, per_step_time: 1414ms, lr: 9.693917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.65625 samples/s/p 3:10:20 } +2024-07-30 02:57:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1302/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.692725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:03,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66089 samples/s/p 3:10:08 } +2024-07-30 02:57:05,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1304/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.691531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:05,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66137 samples/s/p 3:10:05 } +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1306/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 9.690336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66057 samples/s/p 3:10:03 } +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1308/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.689138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.65791 samples/s/p 3:10:06 } +2024-07-30 02:57:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1310/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.687938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66035 samples/s/p 3:09:58 } +2024-07-30 02:57:17,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1312/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 9.686734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:17,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66050 samples/s/p 3:09:55 } +2024-07-30 02:57:20,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1314/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 9.685529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65770 samples/s/p 3:09:58 } +2024-07-30 02:57:22,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1316/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.684323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:22,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65534 samples/s/p 3:10:00 } +2024-07-30 02:57:25,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1318/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 9.683114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:25,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66176 samples/s/p 3:09:44 } +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1320/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 9.681902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:28,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65757 samples/s/p 3:09:50 } +2024-07-30 02:57:31,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1322/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.680688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:31,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65954 samples/s/p 3:09:43 } +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1324/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.679472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:34,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66104 samples/s/p 3:09:37 } +2024-07-30 02:57:37,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1326/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.678254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66071 samples/s/p 3:09:35 } +2024-07-30 02:57:40,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1328/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 9.677034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:40,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65638 samples/s/p 3:09:41 } +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1330/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 9.67581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65852 samples/s/p 3:09:33 } +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1332/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.674586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.66030 samples/s/p 3:09:27 } +2024-07-30 02:57:48,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1334/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.673359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65836 samples/s/p 3:09:28 } +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1336/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.67213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65507 samples/s/p 3:09:32 } +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1338/ 3125], loss: 0.599, per_step_time: 1413ms, lr: 9.670897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66048 samples/s/p 3:09:18 } +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1340/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 9.669664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65370 samples/s/p 3:09:29 } +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1342/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.668427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66100 samples/s/p 3:09:12 } +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1344/ 3125], loss: 0.351, per_step_time: 1414ms, lr: 9.667189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65737 samples/s/p 3:09:16 } +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1346/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.665949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66210 samples/s/p 3:09:04 } +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1348/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.664705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66076 samples/s/p 3:09:04 } +2024-07-30 02:58:11,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1350/ 3125], loss: 0.249, per_step_time: 1412ms, lr: 9.663461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:11,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66466 samples/s/p 3:08:53 } +2024-07-30 02:58:14,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1352/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.662214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:14,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.65935 samples/s/p 3:09:01 } +2024-07-30 02:58:16,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1354/ 3125], loss: 0.305, per_step_time: 1412ms, lr: 9.660965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:16,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66190 samples/s/p 3:08:53 } +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1356/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 9.659713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:19,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65939 samples/s/p 3:08:55 } +2024-07-30 02:58:22,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1358/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 9.658459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:22,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66087 samples/s/p 3:08:49 } +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1360/ 3125], loss: 0.098, per_step_time: 1425ms, lr: 9.657203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.61344 samples/s/p 3:10:22 } +2024-07-30 02:58:28,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1362/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 9.655945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:28,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65977 samples/s/p 3:08:46 } +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1364/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.654684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:31,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65974 samples/s/p 3:08:43 } +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1366/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.65342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65887 samples/s/p 3:08:42 } +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1368/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 9.652156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65978 samples/s/p 3:08:37 } +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1370/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.650888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65940 samples/s/p 3:08:35 } +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1372/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.64962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66131 samples/s/p 3:08:29 } +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1374/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.648348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66132 samples/s/p 3:08:26 } +2024-07-30 02:58:48,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1376/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.647073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:48,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66137 samples/s/p 3:08:23 } +2024-07-30 02:58:50,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1378/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.645798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:50,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65805 samples/s/p 3:08:27 } +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1380/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.64452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65998 samples/s/p 3:08:20 } +2024-07-30 02:58:56,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1382/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.643239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:56,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65895 samples/s/p 3:08:19 } +2024-07-30 02:58:59,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1384/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.641956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:59,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65872 samples/s/p 3:08:17 } +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1386/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 9.640671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65278 samples/s/p 3:08:26 } +2024-07-30 02:59:05,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1388/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.639384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:05,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65689 samples/s/p 3:08:15 } +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1390/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 9.6380945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.66081 samples/s/p 3:08:04 } +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1392/ 3125], loss: 0.252, per_step_time: 1416ms, lr: 9.636802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.64736 samples/s/p 3:08:28 } +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1394/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 9.635509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65666 samples/s/p 3:08:07 } +2024-07-30 02:59:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1396/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.634213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66149 samples/s/p 3:07:54 } +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1398/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.632915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66031 samples/s/p 3:07:54 } +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1400/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.6316135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65705 samples/s/p 3:07:57 } +2024-07-30 02:59:22,059 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1402/ 3125], loss: 0.537, per_step_time: 1414ms, lr: 9.630311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65550 samples/s/p 3:07:58 } +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1404/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.629006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65800 samples/s/p 3:07:50 } +2024-07-30 03:00:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1406/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 9.6277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:02,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65964 samples/s/p 3:07:44 } +2024-07-30 03:00:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1408/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.62639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:05,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65928 samples/s/p 3:07:42 } +2024-07-30 03:00:08,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1410/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 9.625078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:08,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65430 samples/s/p 3:07:49 } +2024-07-30 03:00:11,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1412/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 9.6237645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:11,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65099 samples/s/p 3:07:53 } +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1414/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 9.6224485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65682 samples/s/p 3:07:38 } +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1416/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.621131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65994 samples/s/p 3:07:29 } +2024-07-30 03:00:19,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1418/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 9.61981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:19,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66251 samples/s/p 3:07:21 } +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1420/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.618488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66072 samples/s/p 3:07:22 } +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1422/ 3125], loss: 0.702, per_step_time: 1413ms, lr: 9.617163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66093 samples/s/p 3:07:19 } +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1424/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.615836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:28,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65891 samples/s/p 3:07:20 } +2024-07-30 03:00:31,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1426/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 9.614508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:31,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65672 samples/s/p 3:07:21 } +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1428/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.613175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65990 samples/s/p 3:07:12 } +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1430/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 9.611842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66165 samples/s/p 3:07:06 } +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1432/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.610506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.65918 samples/s/p 3:07:08 } +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1434/ 3125], loss: 0.264, per_step_time: 1416ms, lr: 9.609167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:42,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.64885 samples/s/p 3:07:26 } +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1436/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.607828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.65994 samples/s/p 3:07:01 } +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1438/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.606485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66079 samples/s/p 3:06:56 } +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1440/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 9.605141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66206 samples/s/p 3:06:51 } +2024-07-30 03:00:53,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1442/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 9.603795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:53,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.65972 samples/s/p 3:06:53 } +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1444/ 3125], loss: 0.148, per_step_time: 1417ms, lr: 9.602445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:56,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64181 samples/s/p 3:07:26 } +2024-07-30 03:00:59,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1446/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.601094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64863 samples/s/p 3:07:09 } +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1448/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 9.599741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:02,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64842 samples/s/p 3:07:07 } +2024-07-30 03:01:05,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1450/ 3125], loss: 0.306, per_step_time: 1419ms, lr: 9.598385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:05,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63537 samples/s/p 3:07:30 } +2024-07-30 03:01:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1452/ 3125], loss: 0.187, per_step_time: 1421ms, lr: 9.597027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:08,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.62905 samples/s/p 3:07:40 } +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1454/ 3125], loss: 0.147, per_step_time: 1419ms, lr: 9.595667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63738 samples/s/p 3:07:20 } +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1456/ 3125], loss: 0.250, per_step_time: 1427ms, lr: 9.594305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.60387 samples/s/p 3:08:25 } +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1458/ 3125], loss: 0.402, per_step_time: 1418ms, lr: 9.592941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.63945 samples/s/p 3:07:10 } +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1460/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.591575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65926 samples/s/p 3:06:28 } +2024-07-30 03:01:22,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1462/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.590206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:22,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65871 samples/s/p 3:06:26 } +2024-07-30 03:01:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1464/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.588835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:25,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65800 samples/s/p 3:06:25 } +2024-07-30 03:01:28,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1466/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 9.587462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:28,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65881 samples/s/p 3:06:21 } +2024-07-30 03:01:30,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1468/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.586086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:30,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65736 samples/s/p 3:06:21 } +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1470/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 9.584708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65699 samples/s/p 3:06:19 } +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1472/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.583328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65903 samples/s/p 3:06:12 } +2024-07-30 03:01:39,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1474/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.581947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:39,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65809 samples/s/p 3:06:11 } +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1476/ 3125], loss: 0.335, per_step_time: 1414ms, lr: 9.580563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:42,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65732 samples/s/p 3:06:09 } +2024-07-30 03:01:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1478/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.579177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:45,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65886 samples/s/p 3:06:04 } +2024-07-30 03:01:47,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1480/ 3125], loss: 0.177, per_step_time: 1419ms, lr: 9.577788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:47,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.63617 samples/s/p 3:06:46 } +2024-07-30 03:01:50,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1482/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 9.576398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:50,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65847 samples/s/p 3:05:59 } +2024-07-30 03:01:53,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1484/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 9.575005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:53,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65171 samples/s/p 3:06:09 } +2024-07-30 03:01:56,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1486/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.5736095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:56,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65695 samples/s/p 3:05:56 } +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1488/ 3125], loss: 0.203, per_step_time: 1416ms, lr: 9.572213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.64763 samples/s/p 3:06:12 } +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1490/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 9.570813e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66284 samples/s/p 3:05:39 } +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1492/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.569411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65815 samples/s/p 3:05:45 } +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1494/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 9.568008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66160 samples/s/p 3:05:36 } +2024-07-30 03:02:10,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1496/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 9.566602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:10,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65579 samples/s/p 3:05:44 } +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1498/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 9.565194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65644 samples/s/p 3:05:40 } +2024-07-30 03:02:16,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1500/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 9.563783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:16,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65867 samples/s/p 3:05:33 } +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1502/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.562372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.66044 samples/s/p 3:05:27 } +2024-07-30 03:02:21,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1504/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.560956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:21,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65912 samples/s/p 3:05:26 } +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1506/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 9.55954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66167 samples/s/p 3:05:18 } +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1508/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 9.558121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65501 samples/s/p 3:05:29 } +2024-07-30 03:02:30,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1510/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 9.556699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:30,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65988 samples/s/p 3:05:16 } +2024-07-30 03:02:33,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1512/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 9.555276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65758 samples/s/p 3:05:18 } +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1514/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 9.553851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66033 samples/s/p 3:05:10 } +2024-07-30 03:02:38,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1516/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 9.552423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:38,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65805 samples/s/p 3:05:11 } +2024-07-30 03:02:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1518/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.550993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65949 samples/s/p 3:05:06 } +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1520/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.549562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.66160 samples/s/p 3:04:59 } +2024-07-30 03:02:47,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1522/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.548126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:47,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65839 samples/s/p 3:05:02 } +2024-07-30 03:02:50,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1524/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.54669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65840 samples/s/p 3:04:59 } +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1526/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.545252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65592 samples/s/p 3:05:01 } +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1528/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 9.543812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65744 samples/s/p 3:04:56 } +2024-07-30 03:02:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1530/ 3125], loss: 0.642, per_step_time: 1413ms, lr: 9.542368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:58,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65982 samples/s/p 3:04:48 } +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1532/ 3125], loss: 0.652, per_step_time: 1414ms, lr: 9.540923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65396 samples/s/p 3:04:57 } +2024-07-30 03:03:04,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1534/ 3125], loss: 0.135, per_step_time: 1414ms, lr: 9.539476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:04,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65456 samples/s/p 3:04:53 } +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1536/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.5380265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65884 samples/s/p 3:04:42 } +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1538/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 9.536576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66045 samples/s/p 3:04:36 } +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1540/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 9.5351215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65955 samples/s/p 3:04:35 } +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1542/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.533665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65971 samples/s/p 3:04:31 } +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1544/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.532207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.65999 samples/s/p 3:04:28 } +2024-07-30 03:03:21,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1546/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.530747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:21,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66048 samples/s/p 3:04:24 } +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1548/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.529285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:24,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66004 samples/s/p 3:04:22 } +2024-07-30 03:03:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1550/ 3125], loss: 0.290, per_step_time: 1412ms, lr: 9.52782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:27,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66324 samples/s/p 3:04:13 } +2024-07-30 03:03:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1552/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.526354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:29,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65894 samples/s/p 3:04:19 } +2024-07-30 03:03:32,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1554/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 9.524885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:32,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65663 samples/s/p 3:04:21 } +2024-07-30 03:03:35,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1556/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 9.5234145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:35,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66006 samples/s/p 3:04:11 } +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1558/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.52194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66011 samples/s/p 3:04:08 } +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1560/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.520465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66149 samples/s/p 3:04:03 } +2024-07-30 03:03:44,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1562/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.518988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65957 samples/s/p 3:04:03 } +2024-07-30 03:03:46,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1564/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 9.517508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:46,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65539 samples/s/p 3:04:09 } +2024-07-30 03:03:49,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1566/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 9.516027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:49,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65823 samples/s/p 3:04:00 } +2024-07-30 03:03:52,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1568/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 9.514542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:52,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65742 samples/s/p 3:03:59 } +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1570/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.513056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65813 samples/s/p 3:03:55 } +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1572/ 3125], loss: 0.147, per_step_time: 1414ms, lr: 9.511568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:58,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65447 samples/s/p 3:03:59 } +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1574/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.510079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65951 samples/s/p 3:03:47 } +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1576/ 3125], loss: 0.207, per_step_time: 1425ms, lr: 9.508584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.61136 samples/s/p 3:05:18 } +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1578/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.50709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65938 samples/s/p 3:03:41 } +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1580/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.505594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65745 samples/s/p 3:03:42 } +2024-07-30 03:04:12,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1582/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.504094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:12,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65848 samples/s/p 3:03:37 } +2024-07-30 03:04:15,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1584/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 9.5025935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:15,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65603 samples/s/p 3:03:39 } +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1586/ 3125], loss: 0.383, per_step_time: 1416ms, lr: 9.50109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.64871 samples/s/p 3:03:51 } +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1588/ 3125], loss: 0.414, per_step_time: 1414ms, lr: 9.499584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65706 samples/s/p 3:03:32 } +2024-07-30 03:04:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1590/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.498076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:23,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65414 samples/s/p 3:03:34 } +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1592/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.496567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65963 samples/s/p 3:03:21 } +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1594/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.495055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65399 samples/s/p 3:03:29 } +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1596/ 3125], loss: 0.182, per_step_time: 1414ms, lr: 9.49354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65761 samples/s/p 3:03:19 } +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1598/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.492024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:35,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65401 samples/s/p 3:03:23 } +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1600/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.490506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:38,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65512 samples/s/p 3:03:18 } +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1602/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.488986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66027 samples/s/p 3:03:06 } +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1604/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 9.487463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66311 samples/s/p 3:02:57 } +2024-07-30 03:04:46,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1606/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.485938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65982 samples/s/p 3:03:01 } +2024-07-30 03:04:49,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1608/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.484411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:49,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65563 samples/s/p 3:03:06 } +2024-07-30 03:04:52,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1610/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.482882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:52,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65877 samples/s/p 3:02:57 } +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1612/ 3125], loss: 0.373, per_step_time: 1414ms, lr: 9.48135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65688 samples/s/p 3:02:58 } +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1614/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.479818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.66092 samples/s/p 3:02:47 } +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1616/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.478282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.66024 samples/s/p 3:02:46 } +2024-07-30 03:05:03,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1618/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.476745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:03,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.65866 samples/s/p 3:02:46 } +2024-07-30 03:05:06,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1620/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.475205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:06,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66114 samples/s/p 3:02:38 } +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1622/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 9.473662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66055 samples/s/p 3:02:37 } +2024-07-30 03:05:12,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1624/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 9.472118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:12,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66014 samples/s/p 3:02:35 } +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1626/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.470572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66139 samples/s/p 3:02:29 } +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1628/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.469024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.65977 samples/s/p 3:02:30 } +2024-07-30 03:05:20,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1630/ 3125], loss: 0.332, per_step_time: 1412ms, lr: 9.467472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66197 samples/s/p 3:02:23 } +2024-07-30 03:05:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1632/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 9.465921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66163 samples/s/p 3:02:21 } +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1634/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.4643665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.65849 samples/s/p 3:02:24 } +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1636/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.4628085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:29,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66003 samples/s/p 3:02:18 } +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1638/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 9.46125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:31,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65906 samples/s/p 3:02:17 } +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1640/ 3125], loss: 0.387, per_step_time: 1412ms, lr: 9.459689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66183 samples/s/p 3:02:09 } +2024-07-30 03:05:37,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1642/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.4581255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:37,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65813 samples/s/p 3:02:13 } +2024-07-30 03:05:40,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1644/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 9.45656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:40,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65116 samples/s/p 3:02:24 } +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1646/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 9.454992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65613 samples/s/p 3:02:11 } +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1648/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 9.453423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65776 samples/s/p 3:02:05 } +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1650/ 3125], loss: 0.204, per_step_time: 1415ms, lr: 9.451852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65352 samples/s/p 3:02:11 } +2024-07-30 03:05:51,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1652/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.450278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:51,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65833 samples/s/p 3:01:59 } +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1654/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.448701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:54,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.66116 samples/s/p 3:01:50 } +2024-07-30 03:05:57,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1656/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 9.447123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:57,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66095 samples/s/p 3:01:48 } +2024-07-30 03:06:00,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1658/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.445543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:00,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65927 samples/s/p 3:01:48 } +2024-07-30 03:06:03,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1660/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.443961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:03,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66145 samples/s/p 3:01:41 } +2024-07-30 03:06:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1662/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.442376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65940 samples/s/p 3:01:42 } +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1664/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.44079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65838 samples/s/p 3:01:42 } +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1666/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 9.439201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66351 samples/s/p 3:01:29 } +2024-07-30 03:06:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1668/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.43761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65831 samples/s/p 3:01:36 } +2024-07-30 03:06:17,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1670/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.436017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:17,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66107 samples/s/p 3:01:28 } +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1672/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.434422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65546 samples/s/p 3:01:36 } +2024-07-30 03:06:22,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1674/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.432824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65993 samples/s/p 3:01:24 } +2024-07-30 03:06:25,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1676/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.431225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66141 samples/s/p 3:01:19 } +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1678/ 3125], loss: 0.519, per_step_time: 1413ms, lr: 9.429624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66012 samples/s/p 3:01:18 } +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1680/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 9.42802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65502 samples/s/p 3:01:25 } +2024-07-30 03:06:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1682/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 9.426415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65671 samples/s/p 3:01:19 } +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1684/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 9.424806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.65818 samples/s/p 3:01:14 } +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1686/ 3125], loss: 0.527, per_step_time: 1412ms, lr: 9.423197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.66186 samples/s/p 3:01:04 } +2024-07-30 03:06:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1688/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.421586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:42,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.65902 samples/s/p 3:01:06 } +2024-07-30 03:06:45,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1690/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.419971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:45,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66141 samples/s/p 3:00:59 } +2024-07-30 03:06:48,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1692/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.418355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:48,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66084 samples/s/p 3:00:57 } +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1694/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.416737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66032 samples/s/p 3:00:55 } +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1696/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.415116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66152 samples/s/p 3:00:50 } +2024-07-30 03:06:56,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1698/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.413494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:56,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65886 samples/s/p 3:00:53 } +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1700/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.411869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65785 samples/s/p 3:00:52 } +2024-07-30 03:07:02,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1702/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 9.410242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:02,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66006 samples/s/p 3:00:45 } +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1704/ 3125], loss: 0.429, per_step_time: 1414ms, lr: 9.408614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65599 samples/s/p 3:00:50 } +2024-07-30 03:07:08,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1706/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.406983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:08,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66062 samples/s/p 3:00:38 } +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1708/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 9.4053485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65661 samples/s/p 3:00:43 } +2024-07-30 03:07:13,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1710/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 9.403714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:13,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65986 samples/s/p 3:00:34 } +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1712/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.402076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66066 samples/s/p 3:00:29 } +2024-07-30 03:07:19,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1714/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 9.400437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:19,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66004 samples/s/p 3:00:28 } +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1716/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.398796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:22,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66129 samples/s/p 3:00:22 } +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1718/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.397152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65985 samples/s/p 3:00:22 } +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1720/ 3125], loss: 0.358, per_step_time: 1414ms, lr: 9.395506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:28,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65649 samples/s/p 3:00:26 } +2024-07-30 03:07:30,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1722/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.393859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:30,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65683 samples/s/p 3:00:23 } +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1724/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 9.392209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65449 samples/s/p 3:00:24 } +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1726/ 3125], loss: 0.149, per_step_time: 1417ms, lr: 9.390556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.64557 samples/s/p 3:00:38 } +2024-07-30 03:07:39,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1728/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 9.388902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65652 samples/s/p 3:00:15 } +2024-07-30 03:07:42,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1730/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 9.387246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:42,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66117 samples/s/p 3:00:03 } +2024-07-30 03:07:45,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1732/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.385587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:45,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65573 samples/s/p 3:00:10 } +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1734/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.383927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65594 samples/s/p 3:00:07 } +2024-07-30 03:07:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1736/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.382265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66015 samples/s/p 2:59:56 } +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1738/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.380601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65657 samples/s/p 3:00:00 } +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1740/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.378934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66031 samples/s/p 2:59:50 } +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1742/ 3125], loss: 0.164, per_step_time: 1415ms, lr: 9.377265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65343 samples/s/p 3:00:01 } +2024-07-30 03:08:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1744/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.375594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66231 samples/s/p 2:59:41 } +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1746/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 9.373922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66226 samples/s/p 2:59:38 } +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1748/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.3722465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:07,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65767 samples/s/p 2:59:44 } +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1750/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.3705685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66162 samples/s/p 2:59:34 } +2024-07-30 03:08:13,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1752/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.3688905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:13,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66035 samples/s/p 2:59:33 } +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1754/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.367209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66055 samples/s/p 2:59:30 } +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1756/ 3125], loss: 0.423, per_step_time: 1414ms, lr: 9.365525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.65763 samples/s/p 2:59:33 } +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1758/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.363841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66017 samples/s/p 2:59:25 } +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1760/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.362153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66095 samples/s/p 2:59:21 } +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1762/ 3125], loss: 0.590, per_step_time: 1413ms, lr: 9.360463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65926 samples/s/p 2:59:21 } +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1764/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.358771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65791 samples/s/p 2:59:21 } +2024-07-30 03:08:33,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.357077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:33,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66064 samples/s/p 2:59:13 } +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1768/ 3125], loss: 0.256, per_step_time: 1417ms, lr: 9.355382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.64180 samples/s/p 2:59:46 } +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1770/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.353684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66130 samples/s/p 2:59:06 } +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1772/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 9.351984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66096 samples/s/p 2:59:04 } +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1774/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.350281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.65946 samples/s/p 2:59:04 } +2024-07-30 03:08:47,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1776/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 9.348578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66173 samples/s/p 2:58:57 } +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1778/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.346872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66014 samples/s/p 2:58:57 } +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1780/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 9.345163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66191 samples/s/p 2:58:51 } +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1782/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.343452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65947 samples/s/p 2:58:53 } +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1784/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 9.341739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65888 samples/s/p 2:58:51 } +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1786/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 9.340025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65466 samples/s/p 2:58:56 } +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1788/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.338309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65781 samples/s/p 2:58:47 } +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1790/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.33659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65880 samples/s/p 2:58:43 } +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1792/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 9.334869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65715 samples/s/p 2:58:43 } +2024-07-30 03:09:12,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1794/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 9.333146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:12,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65812 samples/s/p 2:58:38 } +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1796/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.331422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65647 samples/s/p 2:58:39 } +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1798/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 9.329694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65786 samples/s/p 2:58:33 } +2024-07-30 03:09:21,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1800/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.327966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:21,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65825 samples/s/p 2:58:30 } +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1802/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.326234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65596 samples/s/p 2:58:31 } +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1804/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.324502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.66048 samples/s/p 2:58:20 } +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1806/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.322765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65946 samples/s/p 2:58:19 } +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1808/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.321029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65909 samples/s/p 2:58:17 } +2024-07-30 03:09:35,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1810/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.319289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:35,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.66005 samples/s/p 2:58:12 } +2024-07-30 03:09:38,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1812/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.317549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:38,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65887 samples/s/p 2:58:11 } +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1814/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.315804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.66058 samples/s/p 2:58:05 } +2024-07-30 03:09:44,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1816/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.314059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:44,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.65967 samples/s/p 2:58:04 } +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1818/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.312312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.65979 samples/s/p 2:58:01 } +2024-07-30 03:09:49,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1820/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 9.310561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:49,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66058 samples/s/p 2:57:57 } +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1822/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.30881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:52,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66003 samples/s/p 2:57:55 } +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1824/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.307057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:55,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66130 samples/s/p 2:57:50 } +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1826/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.3053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66094 samples/s/p 2:57:48 } +2024-07-30 03:10:01,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1828/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 9.303542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66004 samples/s/p 2:57:47 } +2024-07-30 03:10:03,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1830/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.3017825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:03,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65943 samples/s/p 2:57:45 } +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1832/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 9.300021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:06,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65494 samples/s/p 2:57:51 } +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1834/ 3125], loss: 0.279, per_step_time: 1414ms, lr: 9.298256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65647 samples/s/p 2:57:45 } +2024-07-30 03:10:12,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1836/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.296491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:12,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66159 samples/s/p 2:57:32 } +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1838/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.294722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66042 samples/s/p 2:57:32 } +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1840/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.292952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66160 samples/s/p 2:57:27 } +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1842/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.2911805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65914 samples/s/p 2:57:28 } +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1844/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.289406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:23,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66025 samples/s/p 2:57:24 } +2024-07-30 03:10:26,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1846/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.28763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:26,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65918 samples/s/p 2:57:23 } +2024-07-30 03:10:29,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1848/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.285851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:29,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65874 samples/s/p 2:57:21 } +2024-07-30 03:10:32,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1850/ 3125], loss: 0.507, per_step_time: 1413ms, lr: 9.28407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:32,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66058 samples/s/p 2:57:14 } +2024-07-30 03:10:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1852/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.282288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:35,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65567 samples/s/p 2:57:21 } +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1854/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.280503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65787 samples/s/p 2:57:14 } +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1856/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.278717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:40,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66034 samples/s/p 2:57:06 } +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1858/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.276928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:43,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65795 samples/s/p 2:57:08 } +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1860/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 9.275138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66055 samples/s/p 2:57:00 } +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1862/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.273345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66127 samples/s/p 2:56:56 } +2024-07-30 03:10:52,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1864/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.271551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:52,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66005 samples/s/p 2:56:56 } +2024-07-30 03:10:54,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1866/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.269754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:54,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66014 samples/s/p 2:56:53 } +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1868/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 9.267955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65496 samples/s/p 2:57:00 } +2024-07-30 03:11:00,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1870/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.266154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:00,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66160 samples/s/p 2:56:44 } +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1872/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.264351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65957 samples/s/p 2:56:45 } +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1874/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 9.262546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:06,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65479 samples/s/p 2:56:51 } +2024-07-30 03:11:09,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1876/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.260739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:09,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65848 samples/s/p 2:56:42 } +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1878/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 9.258931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65490 samples/s/p 2:56:46 } +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1880/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.257119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.66131 samples/s/p 2:56:31 } +2024-07-30 03:11:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1882/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 9.255306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:17,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65844 samples/s/p 2:56:33 } +2024-07-30 03:11:20,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1884/ 3125], loss: 0.320, per_step_time: 1428ms, lr: 9.253491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:20,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.60050 samples/s/p 2:58:20 } +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1886/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 9.251674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.66175 samples/s/p 2:56:21 } +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1888/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65605 samples/s/p 2:56:29 } +2024-07-30 03:11:29,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1890/ 3125], loss: 0.278, per_step_time: 1412ms, lr: 9.248033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66189 samples/s/p 2:56:15 } +2024-07-30 03:11:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1892/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.24621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:31,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65943 samples/s/p 2:56:17 } +2024-07-30 03:11:34,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1894/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.244384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66091 samples/s/p 2:56:12 } +2024-07-30 03:11:37,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1896/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 9.242558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:37,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65998 samples/s/p 2:56:11 } +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1898/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.240728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65911 samples/s/p 2:56:09 } +2024-07-30 03:11:43,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1900/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.238896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66079 samples/s/p 2:56:03 } +2024-07-30 03:11:46,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1902/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.237063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:46,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65952 samples/s/p 2:56:03 } +2024-07-30 03:11:48,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1904/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.235228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:48,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65928 samples/s/p 2:56:01 } +2024-07-30 03:11:51,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1906/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.233391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66095 samples/s/p 2:55:55 } +2024-07-30 03:11:54,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1908/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 9.231551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:54,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66111 samples/s/p 2:55:51 } +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1910/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 9.22971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66023 samples/s/p 2:55:50 } +2024-07-30 03:12:00,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1912/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 9.227867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:00,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66060 samples/s/p 2:55:47 } +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1914/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.226022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66009 samples/s/p 2:55:45 } +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1916/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.2241735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66192 samples/s/p 2:55:39 } +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1918/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.222324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65969 samples/s/p 2:55:40 } +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1920/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 9.220473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66095 samples/s/p 2:55:35 } +2024-07-30 03:12:14,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1922/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.218618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:14,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65838 samples/s/p 2:55:37 } +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1924/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 9.216764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66020 samples/s/p 2:55:31 } +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1926/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.214905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66099 samples/s/p 2:55:26 } +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1928/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.213046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65773 samples/s/p 2:55:30 } +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1930/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.211185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66168 samples/s/p 2:55:19 } +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1932/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 9.209321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65480 samples/s/p 2:55:29 } +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1934/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 9.207456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66106 samples/s/p 2:55:15 } +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1936/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.205588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65856 samples/s/p 2:55:17 } +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1938/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.203719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65994 samples/s/p 2:55:11 } +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1940/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 9.201847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65563 samples/s/p 2:55:16 } +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1942/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.199974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65708 samples/s/p 2:55:11 } +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1944/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.198097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66131 samples/s/p 2:55:00 } +2024-07-30 03:12:48,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1946/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.19622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65812 samples/s/p 2:55:03 } +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1948/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.19434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65911 samples/s/p 2:54:59 } +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1950/ 3125], loss: 0.079, per_step_time: 1413ms, lr: 9.192459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:54,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65826 samples/s/p 2:54:57 } +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1952/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 9.190576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65622 samples/s/p 2:54:58 } +2024-07-30 03:12:59,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1954/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.18869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:59,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65872 samples/s/p 2:54:51 } +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1956/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.186801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65943 samples/s/p 2:54:47 } +2024-07-30 03:13:05,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1958/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.184912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:05,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66325 samples/s/p 2:54:37 } +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1960/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.183021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66168 samples/s/p 2:54:37 } +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1962/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 9.181127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65856 samples/s/p 2:54:40 } +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1964/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.179231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66024 samples/s/p 2:54:34 } +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1966/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.1773345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66113 samples/s/p 2:54:29 } +2024-07-30 03:13:19,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1968/ 3125], loss: 0.075, per_step_time: 1413ms, lr: 9.175434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:19,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.65864 samples/s/p 2:54:31 } +2024-07-30 03:13:22,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1970/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.173533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:22,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66123 samples/s/p 2:54:24 } +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1972/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 9.171628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66122 samples/s/p 2:54:21 } +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1974/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.169723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66113 samples/s/p 2:54:18 } +2024-07-30 03:13:30,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1976/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.167815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:30,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66036 samples/s/p 2:54:17 } +2024-07-30 03:13:33,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1978/ 3125], loss: 0.148, per_step_time: 1414ms, lr: 9.165906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:33,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65582 samples/s/p 2:54:22 } +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1980/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.163994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:36,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66031 samples/s/p 2:54:11 } +2024-07-30 03:13:39,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1982/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.1620805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:39,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65962 samples/s/p 2:54:10 } +2024-07-30 03:13:42,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1984/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.160166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:42,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66131 samples/s/p 2:54:04 } +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1986/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.158248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66119 samples/s/p 2:54:01 } +2024-07-30 03:13:47,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1988/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.156328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:47,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66027 samples/s/p 2:54:00 } +2024-07-30 03:13:50,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1990/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 9.154406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:50,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66171 samples/s/p 2:53:55 } +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1992/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.1524835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66035 samples/s/p 2:53:54 } +2024-07-30 03:13:56,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1994/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:56,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66005 samples/s/p 2:53:52 } +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1996/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 9.14863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:59,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66191 samples/s/p 2:53:46 } +2024-07-30 03:14:02,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1998/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.1467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:02,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66116 samples/s/p 2:53:44 } +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2000/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.144769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:04,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66102 samples/s/p 2:53:42 } +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2002/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.1428365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65800 samples/s/p 2:53:44 } +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2004/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.140901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65960 samples/s/p 2:53:39 } +2024-07-30 03:14:13,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2006/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.138963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:13,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.66021 samples/s/p 2:53:35 } +2024-07-30 03:14:16,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2008/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.137024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65315 samples/s/p 2:53:45 } +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2010/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.135083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65834 samples/s/p 2:53:32 } +2024-07-30 03:14:21,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2012/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.1331385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66187 samples/s/p 2:53:23 } +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2014/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 9.131193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65451 samples/s/p 2:53:34 } +2024-07-30 03:14:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2016/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.129246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:27,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65830 samples/s/p 2:53:24 } +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2018/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.127297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65570 samples/s/p 2:53:26 } +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2020/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 9.125346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66153 samples/s/p 2:53:12 } +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2022/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.123393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65963 samples/s/p 2:53:13 } +2024-07-30 03:14:38,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2024/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.121438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:38,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65584 samples/s/p 2:53:17 } +2024-07-30 03:14:41,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2026/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.119481e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:41,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65877 samples/s/p 2:53:09 } +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2028/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.117522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65838 samples/s/p 2:53:07 } +2024-07-30 03:14:47,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2030/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 9.11556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:47,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66082 samples/s/p 2:53:00 } +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2032/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.113598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65795 samples/s/p 2:53:02 } +2024-07-30 03:14:53,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2034/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.1116335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65878 samples/s/p 2:52:58 } +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2036/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.109666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65966 samples/s/p 2:52:53 } +2024-07-30 03:14:58,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2038/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 9.107697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:58,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65677 samples/s/p 2:52:56 } +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2040/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 9.105726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65590 samples/s/p 2:52:55 } +2024-07-30 03:15:04,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2042/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.103754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:04,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66061 samples/s/p 2:52:43 } +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2044/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.101778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65971 samples/s/p 2:52:42 } +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2046/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.099802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66120 samples/s/p 2:52:36 } +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2048/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 9.097823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66158 samples/s/p 2:52:33 } +2024-07-30 03:15:15,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2050/ 3125], loss: 0.395, per_step_time: 1412ms, lr: 9.095843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:15,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66176 samples/s/p 2:52:30 } +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2052/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.09386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.65857 samples/s/p 2:52:33 } +2024-07-30 03:15:21,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2054/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 9.091876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:21,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66114 samples/s/p 2:52:25 } +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2056/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.089889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66165 samples/s/p 2:52:21 } +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2058/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.0879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66078 samples/s/p 2:52:20 } +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2060/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 9.08591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.65903 samples/s/p 2:52:21 } +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2062/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.0839185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66083 samples/s/p 2:52:14 } +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2064/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 9.081924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65567 samples/s/p 2:52:21 } +2024-07-30 03:15:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2066/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 9.079927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65656 samples/s/p 2:52:17 } +2024-07-30 03:15:41,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2068/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.0779295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:41,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65680 samples/s/p 2:52:13 } +2024-07-30 03:15:44,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2070/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.0759295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66159 samples/s/p 2:52:02 } +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 9.073927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65833 samples/s/p 2:52:05 } +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2074/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 9.071923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65332 samples/s/p 2:52:11 } +2024-07-30 03:15:52,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2076/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.069917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:52,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66056 samples/s/p 2:51:55 } +2024-07-30 03:15:55,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2078/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.06791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:55,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66100 samples/s/p 2:51:51 } +2024-07-30 03:15:58,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2080/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:58,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66096 samples/s/p 2:51:49 } +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2082/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 9.063888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65784 samples/s/p 2:51:52 } +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2084/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.061873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65933 samples/s/p 2:51:46 } +2024-07-30 03:16:06,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2086/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.059858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:06,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66078 samples/s/p 2:51:41 } +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2088/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.0578405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65790 samples/s/p 2:51:43 } +2024-07-30 03:16:12,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2090/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0558215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:12,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66053 samples/s/p 2:51:35 } +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2092/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.0538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:15,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65939 samples/s/p 2:51:35 } +2024-07-30 03:16:18,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2094/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 9.051776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:18,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66135 samples/s/p 2:51:28 } +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2096/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.049751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66052 samples/s/p 2:51:27 } +2024-07-30 03:16:23,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2098/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 9.047724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:23,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65548 samples/s/p 2:51:33 } +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2100/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.045693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65884 samples/s/p 2:51:24 } +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2102/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.043662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66091 samples/s/p 2:51:18 } +2024-07-30 03:16:32,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2104/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 9.04163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:32,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65444 samples/s/p 2:51:27 } +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2106/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 9.039595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66209 samples/s/p 2:51:10 } +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2108/ 3125], loss: 0.154, per_step_time: 1414ms, lr: 9.037558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65543 samples/s/p 2:51:19 } +2024-07-30 03:16:40,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2110/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 9.035519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:40,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66205 samples/s/p 2:51:04 } +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2112/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.033478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65886 samples/s/p 2:51:07 } +2024-07-30 03:16:46,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2114/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.031435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:46,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65839 samples/s/p 2:51:05 } +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2116/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 9.029391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66222 samples/s/p 2:50:56 } +2024-07-30 03:16:52,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2118/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.027343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:52,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66194 samples/s/p 2:50:53 } +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2120/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.025296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66161 samples/s/p 2:50:51 } +2024-07-30 03:16:57,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2122/ 3125], loss: 0.121, per_step_time: 1412ms, lr: 9.023245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:57,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66175 samples/s/p 2:50:48 } +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2124/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 9.021193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65916 samples/s/p 2:50:50 } +2024-07-30 03:17:03,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2126/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.019139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:03,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66168 samples/s/p 2:50:42 } +2024-07-30 03:17:06,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2128/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.017082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:06,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65961 samples/s/p 2:50:43 } +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2130/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.015024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66174 samples/s/p 2:50:37 } +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2132/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 9.012964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:11,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65877 samples/s/p 2:50:39 } +2024-07-30 03:17:14,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2134/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 9.010902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66017 samples/s/p 2:50:34 } +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2136/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.008838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66013 samples/s/p 2:50:31 } +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2138/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.006773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66168 samples/s/p 2:50:25 } +2024-07-30 03:17:23,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2140/ 3125], loss: 0.387, per_step_time: 1416ms, lr: 9.004705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:23,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.64830 samples/s/p 2:50:47 } +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2142/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.002635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65998 samples/s/p 2:50:23 } +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2144/ 3125], loss: 0.336, per_step_time: 1415ms, lr: 9.000564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.65360 samples/s/p 2:50:32 } +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2146/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 8.998491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66161 samples/s/p 2:50:14 } +2024-07-30 03:17:34,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2148/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 8.996415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:34,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.65972 samples/s/p 2:50:15 } +2024-07-30 03:17:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2150/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 8.994339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66117 samples/s/p 2:50:09 } +2024-07-30 03:17:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2152/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.992258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:40,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65877 samples/s/p 2:50:11 } +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2154/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 8.990178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66210 samples/s/p 2:50:02 } +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2156/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.988095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65927 samples/s/p 2:50:04 } +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2158/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 8.9860105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65953 samples/s/p 2:50:01 } +2024-07-30 03:17:51,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2160/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 8.983923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:51,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66203 samples/s/p 2:49:54 } +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2162/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.981835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66001 samples/s/p 2:49:55 } +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2164/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 8.979744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65598 samples/s/p 2:49:59 } +2024-07-30 03:18:00,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2166/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 8.977651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:00,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66034 samples/s/p 2:49:48 } +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2168/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.975558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65818 samples/s/p 2:49:49 } +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2170/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 8.973461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66028 samples/s/p 2:49:43 } +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2172/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 8.971362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65952 samples/s/p 2:49:41 } +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2174/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 8.969263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65847 samples/s/p 2:49:40 } +2024-07-30 03:18:14,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2176/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 8.967161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:14,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65481 samples/s/p 2:49:44 } +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2178/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 8.9650575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65616 samples/s/p 2:49:39 } +2024-07-30 03:18:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2180/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 8.962952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65789 samples/s/p 2:49:33 } +2024-07-30 03:18:22,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2182/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 8.960844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:22,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65944 samples/s/p 2:49:27 } +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2184/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 8.958734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65753 samples/s/p 2:49:28 } +2024-07-30 03:18:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2186/ 3125], loss: 0.458, per_step_time: 1414ms, lr: 8.956623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65671 samples/s/p 2:49:27 } +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2188/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.954509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65639 samples/s/p 2:49:24 } +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2190/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.952395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66071 samples/s/p 2:49:14 } +2024-07-30 03:18:36,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2192/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 8.950277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66055 samples/s/p 2:49:11 } +2024-07-30 03:18:39,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2194/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 8.948158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:39,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66108 samples/s/p 2:49:07 } +2024-07-30 03:18:42,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2196/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.946038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:42,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66079 samples/s/p 2:49:05 } +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2198/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.943915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:45,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65996 samples/s/p 2:49:04 } +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2200/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 8.94179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66180 samples/s/p 2:48:58 } +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2202/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 8.939664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:51,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66075 samples/s/p 2:48:57 } +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2204/ 3125], loss: 0.249, per_step_time: 1415ms, lr: 8.937535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.65256 samples/s/p 2:49:09 } +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 8.935404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66223 samples/s/p 2:48:48 } +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2208/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.9332725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65914 samples/s/p 2:48:51 } +2024-07-30 03:19:02,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2210/ 3125], loss: 0.392, per_step_time: 1412ms, lr: 8.931139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:02,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66396 samples/s/p 2:48:40 } +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2212/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.929003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65859 samples/s/p 2:48:46 } +2024-07-30 03:19:08,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2214/ 3125], loss: 0.446, per_step_time: 1415ms, lr: 8.926866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65031 samples/s/p 2:48:58 } +2024-07-30 03:19:10,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2216/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.924726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:10,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65921 samples/s/p 2:48:40 } +2024-07-30 03:19:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2218/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.922584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66169 samples/s/p 2:48:32 } +2024-07-30 03:19:16,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2220/ 3125], loss: 0.357, per_step_time: 1425ms, lr: 8.92044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.61307 samples/s/p 2:49:57 } +2024-07-30 03:19:19,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2222/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.918296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:19,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.65922 samples/s/p 2:48:31 } +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2224/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.916148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66051 samples/s/p 2:48:26 } +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2226/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.913999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66127 samples/s/p 2:48:22 } +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2228/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.911848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66054 samples/s/p 2:48:20 } +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2230/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.909696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65947 samples/s/p 2:48:19 } +2024-07-30 03:19:33,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2232/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.907542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:33,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65835 samples/s/p 2:48:19 } +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2234/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.905385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65823 samples/s/p 2:48:16 } +2024-07-30 03:19:39,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2236/ 3125], loss: 0.187, per_step_time: 1416ms, lr: 8.903226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:39,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.64603 samples/s/p 2:48:35 } +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2238/ 3125], loss: 0.119, per_step_time: 1414ms, lr: 8.901066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65667 samples/s/p 2:48:13 } +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2240/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.8989045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65962 samples/s/p 2:48:05 } +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2242/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.896741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66015 samples/s/p 2:48:01 } +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2244/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.894574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66083 samples/s/p 2:47:57 } +2024-07-30 03:19:53,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2246/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.892407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66007 samples/s/p 2:47:56 } +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2248/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.890238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66014 samples/s/p 2:47:53 } +2024-07-30 03:19:59,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2250/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.888067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:59,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66031 samples/s/p 2:47:50 } +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2252/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.885892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66048 samples/s/p 2:47:46 } +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2254/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.883718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66078 samples/s/p 2:47:43 } +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2256/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.881541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65873 samples/s/p 2:47:44 } +2024-07-30 03:20:10,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2258/ 3125], loss: 0.159, per_step_time: 1416ms, lr: 8.879362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:10,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.64871 samples/s/p 2:47:59 } +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2260/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.877181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65961 samples/s/p 2:47:37 } +2024-07-30 03:20:16,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2262/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.874999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:16,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66080 samples/s/p 2:47:32 } +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2264/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.872815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65670 samples/s/p 2:47:36 } +2024-07-30 03:20:21,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2266/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.870629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:21,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66112 samples/s/p 2:47:26 } +2024-07-30 03:20:24,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2268/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.86844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66025 samples/s/p 2:47:24 } +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2270/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.86625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66098 samples/s/p 2:47:20 } +2024-07-30 03:20:30,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2272/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.864059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:30,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.65801 samples/s/p 2:47:23 } +2024-07-30 03:20:33,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2274/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.861865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:33,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66152 samples/s/p 2:47:14 } +2024-07-30 03:20:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2276/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.85967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65951 samples/s/p 2:47:14 } +2024-07-30 03:20:38,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2278/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 8.8574725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:38,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65977 samples/s/p 2:47:11 } +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2280/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.855273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65811 samples/s/p 2:47:11 } +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2282/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.853073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66099 samples/s/p 2:47:03 } +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2284/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 8.85087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65707 samples/s/p 2:47:07 } +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2286/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 8.848665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65487 samples/s/p 2:47:08 } +2024-07-30 03:20:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2288/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.8464585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:53,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66121 samples/s/p 2:46:54 } +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2290/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.84425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66141 samples/s/p 2:46:51 } +2024-07-30 03:20:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2292/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 8.842041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:58,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65856 samples/s/p 2:46:53 } +2024-07-30 03:21:01,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2294/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 8.839828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:01,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65697 samples/s/p 2:46:53 } +2024-07-30 03:21:04,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2296/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 8.837615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:04,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65756 samples/s/p 2:46:49 } +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2298/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 8.835399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65457 samples/s/p 2:46:52 } +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2300/ 3125], loss: 0.378, per_step_time: 1415ms, lr: 8.833182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65307 samples/s/p 2:46:52 } +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2302/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 8.8309625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65856 samples/s/p 2:46:39 } +2024-07-30 03:21:15,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2304/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.828741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65864 samples/s/p 2:46:36 } +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2306/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 8.826519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65838 samples/s/p 2:46:34 } +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2308/ 3125], loss: 0.211, per_step_time: 1415ms, lr: 8.824293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65254 samples/s/p 2:46:41 } +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2310/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 8.822068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.66206 samples/s/p 2:46:22 } +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2312/ 3125], loss: 0.224, per_step_time: 1416ms, lr: 8.8198385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.64921 samples/s/p 2:46:42 } +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2314/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 8.817608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66143 samples/s/p 2:46:17 } +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2316/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 8.8153765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66226 samples/s/p 2:46:13 } +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2318/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 8.813143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.65958 samples/s/p 2:46:15 } +2024-07-30 03:21:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2320/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.810907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:38,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66270 samples/s/p 2:46:06 } +2024-07-30 03:21:41,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2322/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 8.808669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66115 samples/s/p 2:46:06 } +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2324/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.80643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.65938 samples/s/p 2:46:07 } +2024-07-30 03:21:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2326/ 3125], loss: 0.665, per_step_time: 1413ms, lr: 8.804189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66103 samples/s/p 2:46:01 } +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2328/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 8.801945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.65746 samples/s/p 2:46:04 } +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2330/ 3125], loss: 0.517, per_step_time: 1413ms, lr: 8.7997005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:52,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66023 samples/s/p 2:45:57 } +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2332/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.797455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65976 samples/s/p 2:45:55 } +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2334/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 8.795207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66012 samples/s/p 2:45:51 } +2024-07-30 03:22:01,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2336/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 8.792956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:01,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66009 samples/s/p 2:45:48 } +2024-07-30 03:22:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2338/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.790704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:03,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65957 samples/s/p 2:45:47 } +2024-07-30 03:22:06,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2340/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 8.788449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:06,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66073 samples/s/p 2:45:42 } +2024-07-30 03:22:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2342/ 3125], loss: 0.110, per_step_time: 1412ms, lr: 8.7861945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:09,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66201 samples/s/p 2:45:37 } +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2344/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.783937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66145 samples/s/p 2:45:35 } +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2346/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.781677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66087 samples/s/p 2:45:33 } +2024-07-30 03:22:18,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2348/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 8.779416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:18,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.65866 samples/s/p 2:45:34 } +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2350/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 8.777153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65827 samples/s/p 2:45:32 } +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2352/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 8.774889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:23,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.66099 samples/s/p 2:45:24 } +2024-07-30 03:22:26,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2354/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.772622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:26,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.66082 samples/s/p 2:45:22 } +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2356/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.770355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65627 samples/s/p 2:45:27 } +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2358/ 3125], loss: 0.312, per_step_time: 1415ms, lr: 8.768084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65287 samples/s/p 2:45:30 } +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2360/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 8.765812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66144 samples/s/p 2:45:12 } +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2362/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.763538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65880 samples/s/p 2:45:14 } +2024-07-30 03:22:40,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2364/ 3125], loss: 0.183, per_step_time: 1419ms, lr: 8.7612625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:40,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.63686 samples/s/p 2:45:50 } +2024-07-30 03:22:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2366/ 3125], loss: 0.127, per_step_time: 1412ms, lr: 8.758985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66218 samples/s/p 2:45:02 } +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2368/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.756707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65858 samples/s/p 2:45:06 } +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2370/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 8.754426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65920 samples/s/p 2:45:02 } +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2372/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.752143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65528 samples/s/p 2:45:06 } +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2374/ 3125], loss: 0.473, per_step_time: 1417ms, lr: 8.749858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.64326 samples/s/p 2:45:24 } +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2376/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.747572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65960 samples/s/p 2:44:53 } +2024-07-30 03:23:00,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2378/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 8.745284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:00,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65813 samples/s/p 2:44:53 } +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2380/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.7429935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65826 samples/s/p 2:44:49 } +2024-07-30 03:23:06,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2382/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 8.7407025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:06,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66270 samples/s/p 2:44:39 } +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2384/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.738409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65949 samples/s/p 2:44:42 } +2024-07-30 03:23:11,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2386/ 3125], loss: 0.167, per_step_time: 1412ms, lr: 8.736114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:11,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66257 samples/s/p 2:44:33 } +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2388/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.733817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:14,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66159 samples/s/p 2:44:32 } +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2390/ 3125], loss: 0.474, per_step_time: 1412ms, lr: 8.731518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66216 samples/s/p 2:44:29 } +2024-07-30 03:23:20,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2392/ 3125], loss: 0.226, per_step_time: 1412ms, lr: 8.729217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:20,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66178 samples/s/p 2:44:26 } +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2394/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 8.726915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66052 samples/s/p 2:44:26 } +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2396/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.724612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65902 samples/s/p 2:44:26 } +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2398/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 8.722305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66004 samples/s/p 2:44:21 } +2024-07-30 03:23:31,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2400/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.719997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65909 samples/s/p 2:44:20 } +2024-07-30 03:23:34,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2402/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.717688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:34,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65930 samples/s/p 2:44:17 } +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2404/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.715378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65954 samples/s/p 2:44:13 } +2024-07-30 03:23:40,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2406/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 8.713065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:40,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66115 samples/s/p 2:44:08 } +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2408/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 8.710749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.65035 samples/s/p 2:44:24 } +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2410/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.708433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66101 samples/s/p 2:44:02 } +2024-07-30 03:23:48,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2412/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.706115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:48,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66019 samples/s/p 2:44:01 } +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2414/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.703795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66160 samples/s/p 2:43:56 } +2024-07-30 03:23:54,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2416/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.701472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:54,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66105 samples/s/p 2:43:54 } +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2418/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.699149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66050 samples/s/p 2:43:52 } +2024-07-30 03:24:00,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2420/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 8.696824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65983 samples/s/p 2:43:50 } +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2422/ 3125], loss: 0.210, per_step_time: 1415ms, lr: 8.694497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65252 samples/s/p 2:44:00 } +2024-07-30 03:24:05,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2424/ 3125], loss: 0.583, per_step_time: 1414ms, lr: 8.692168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:05,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65723 samples/s/p 2:43:49 } +2024-07-30 03:24:08,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2426/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.689837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:08,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66167 samples/s/p 2:43:39 } +2024-07-30 03:24:11,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2428/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 8.687505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:11,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66085 samples/s/p 2:43:37 } +2024-07-30 03:24:14,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2430/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 8.6851705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:14,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66161 samples/s/p 2:43:33 } +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2432/ 3125], loss: 0.409, per_step_time: 1415ms, lr: 8.682835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65309 samples/s/p 2:43:45 } +2024-07-30 03:24:19,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2434/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 8.680497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:19,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.66203 samples/s/p 2:43:27 } +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2436/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 8.678157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.65817 samples/s/p 2:43:30 } +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2438/ 3125], loss: 0.460, per_step_time: 1414ms, lr: 8.675816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65683 samples/s/p 2:43:30 } +2024-07-30 03:24:28,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2440/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 8.6734735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65934 samples/s/p 2:43:23 } +2024-07-30 03:24:31,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2442/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 8.671129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65734 samples/s/p 2:43:23 } +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2444/ 3125], loss: 0.472, per_step_time: 1413ms, lr: 8.668782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66081 samples/s/p 2:43:15 } +2024-07-30 03:24:36,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2446/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.666434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65852 samples/s/p 2:43:16 } +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2448/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 8.664085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65944 samples/s/p 2:43:11 } +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2450/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.661733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65954 samples/s/p 2:43:08 } +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2452/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.659379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65931 samples/s/p 2:43:06 } +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2454/ 3125], loss: 0.155, per_step_time: 1414ms, lr: 8.6570235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65512 samples/s/p 2:43:10 } +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2456/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 8.654667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66098 samples/s/p 2:42:57 } +2024-07-30 03:24:53,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2458/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.652309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65882 samples/s/p 2:42:58 } +2024-07-30 03:24:56,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2460/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 8.649948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66101 samples/s/p 2:42:52 } +2024-07-30 03:24:59,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2462/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.647586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:59,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65935 samples/s/p 2:42:52 } +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2464/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.645222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66068 samples/s/p 2:42:47 } +2024-07-30 03:25:05,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2466/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 8.642855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:05,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66256 samples/s/p 2:42:40 } +2024-07-30 03:25:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2468/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.640488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65830 samples/s/p 2:42:45 } +2024-07-30 03:25:10,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2470/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.638119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:10,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65753 samples/s/p 2:42:43 } +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2472/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 8.635749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65512 samples/s/p 2:42:45 } +2024-07-30 03:25:16,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2474/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.633376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65856 samples/s/p 2:42:36 } +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2476/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 8.631002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65539 samples/s/p 2:42:39 } +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2478/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.628625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65623 samples/s/p 2:42:34 } +2024-07-30 03:25:25,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2480/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.626247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65979 samples/s/p 2:42:25 } +2024-07-30 03:25:27,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2482/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 8.623868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:27,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65986 samples/s/p 2:42:22 } +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2484/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 8.621487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66204 samples/s/p 2:42:16 } +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2486/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.619103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66142 samples/s/p 2:42:14 } +2024-07-30 03:25:36,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2488/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.616719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:36,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.65946 samples/s/p 2:42:15 } +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2490/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.614333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65777 samples/s/p 2:42:15 } +2024-07-30 03:25:42,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2492/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 8.611944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:42,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65894 samples/s/p 2:42:10 } +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2494/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65975 samples/s/p 2:42:06 } +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2496/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 8.607162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65965 samples/s/p 2:42:03 } +2024-07-30 03:25:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2498/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.6047685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:50,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65891 samples/s/p 2:42:02 } +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2500/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.602375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66013 samples/s/p 2:41:57 } +2024-07-30 03:25:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2502/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 8.599976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:56,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65589 samples/s/p 2:42:01 } +2024-07-30 03:25:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2504/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 8.597579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65730 samples/s/p 2:41:56 } +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2506/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.595178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66051 samples/s/p 2:41:47 } +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2508/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 8.592777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66054 samples/s/p 2:41:45 } +2024-07-30 03:26:07,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2510/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 8.590373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66109 samples/s/p 2:41:41 } +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2512/ 3125], loss: 0.230, per_step_time: 1416ms, lr: 8.587968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.64950 samples/s/p 2:41:58 } +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2514/ 3125], loss: 0.258, per_step_time: 1415ms, lr: 8.58556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.65357 samples/s/p 2:41:48 } +2024-07-30 03:26:16,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2516/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 8.5831525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:16,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66009 samples/s/p 2:41:34 } +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2518/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.580741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65696 samples/s/p 2:41:37 } +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2520/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.578329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66044 samples/s/p 2:41:28 } +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2522/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.575915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:24,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66007 samples/s/p 2:41:26 } +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2524/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.573499e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65871 samples/s/p 2:41:25 } +2024-07-30 03:26:30,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2526/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 8.571082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:30,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66223 samples/s/p 2:41:16 } +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2528/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 8.568663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65576 samples/s/p 2:41:24 } +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2530/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.566242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65941 samples/s/p 2:41:15 } +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2532/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 8.563819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65945 samples/s/p 2:41:13 } +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2534/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.561396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.66040 samples/s/p 2:41:08 } +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2536/ 3125], loss: 0.029, per_step_time: 1412ms, lr: 8.55897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66221 samples/s/p 2:41:02 } +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2538/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 8.556542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66045 samples/s/p 2:41:02 } +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2540/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 8.554112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66019 samples/s/p 2:41:00 } +2024-07-30 03:26:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2542/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.551682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:52,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66027 samples/s/p 2:40:57 } +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2544/ 3125], loss: 0.513, per_step_time: 1412ms, lr: 8.549249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66194 samples/s/p 2:40:51 } +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2546/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 8.546815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65951 samples/s/p 2:40:53 } +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2548/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 8.544379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66079 samples/s/p 2:40:48 } +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2550/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 8.541941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65882 samples/s/p 2:40:48 } +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2552/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.539501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65910 samples/s/p 2:40:45 } +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2554/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 8.537061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66197 samples/s/p 2:40:37 } +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2556/ 3125], loss: 0.344, per_step_time: 1415ms, lr: 8.534618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65294 samples/s/p 2:40:50 } +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2558/ 3125], loss: 0.511, per_step_time: 1414ms, lr: 8.532173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65588 samples/s/p 2:40:42 } +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2560/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 8.529727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65734 samples/s/p 2:40:37 } +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2562/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 8.5272795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65986 samples/s/p 2:40:29 } +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2564/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.52483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65930 samples/s/p 2:40:28 } +2024-07-30 03:27:26,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2566/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 8.522378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:26,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65887 samples/s/p 2:40:25 } +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2568/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.519925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65983 samples/s/p 2:40:21 } +2024-07-30 03:27:32,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2570/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.517471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:32,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66074 samples/s/p 2:40:17 } +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2572/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 8.515014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:35,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65912 samples/s/p 2:40:17 } +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2574/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.512557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66071 samples/s/p 2:40:11 } +2024-07-30 03:27:41,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2576/ 3125], loss: 0.606, per_step_time: 1414ms, lr: 8.510097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:41,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65445 samples/s/p 2:40:19 } +2024-07-30 03:27:43,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2578/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.507635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:44,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66129 samples/s/p 2:40:04 } +2024-07-30 03:27:46,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2580/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 8.505172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66083 samples/s/p 2:40:02 } +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2582/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.502709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66053 samples/s/p 2:40:00 } +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2584/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 8.500242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:52,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65863 samples/s/p 2:40:00 } +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2586/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 8.497773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65779 samples/s/p 2:39:59 } +2024-07-30 03:27:58,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2588/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.495304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:58,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66072 samples/s/p 2:39:51 } +2024-07-30 03:28:01,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2590/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 8.492833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65940 samples/s/p 2:39:51 } +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2592/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.4903595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66084 samples/s/p 2:39:45 } +2024-07-30 03:28:06,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2594/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.487885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65995 samples/s/p 2:39:44 } +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2596/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.485409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66079 samples/s/p 2:39:40 } +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2598/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.482931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66100 samples/s/p 2:39:37 } +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2600/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.480451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65913 samples/s/p 2:39:37 } +2024-07-30 03:28:18,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2602/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 8.477969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:18,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65585 samples/s/p 2:39:40 } +2024-07-30 03:28:20,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2604/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.4754865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:20,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65960 samples/s/p 2:39:31 } +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2606/ 3125], loss: 0.323, per_step_time: 1424ms, lr: 8.473002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.61452 samples/s/p 2:40:44 } +2024-07-30 03:28:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2608/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 8.470515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66039 samples/s/p 2:39:24 } +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2610/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 8.468027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66241 samples/s/p 2:39:17 } +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2612/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 8.465538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65733 samples/s/p 2:39:23 } +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2614/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 8.4630465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65895 samples/s/p 2:39:17 } +2024-07-30 03:28:37,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2616/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 8.4605535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65757 samples/s/p 2:39:17 } +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2618/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.45806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.66131 samples/s/p 2:39:08 } +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2620/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 8.455562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65726 samples/s/p 2:39:12 } +2024-07-30 03:28:46,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2622/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.453065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:46,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.65819 samples/s/p 2:39:07 } +2024-07-30 03:28:49,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2624/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.4505655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:49,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.65974 samples/s/p 2:39:02 } +2024-07-30 03:28:52,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2626/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.448064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:52,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.66145 samples/s/p 2:38:56 } +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2628/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 8.445561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.65533 samples/s/p 2:39:04 } +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2630/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 8.443058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66174 samples/s/p 2:38:50 } +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2632/ 3125], loss: 0.303, per_step_time: 1415ms, lr: 8.440551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65338 samples/s/p 2:39:01 } +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2634/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.438044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66146 samples/s/p 2:38:45 } +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2636/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 8.435534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66209 samples/s/p 2:38:41 } +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2638/ 3125], loss: 0.058, per_step_time: 1415ms, lr: 8.433022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65181 samples/s/p 2:38:56 } +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2640/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 8.43051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66310 samples/s/p 2:38:34 } +2024-07-30 03:29:14,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2642/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 8.427995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:14,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66037 samples/s/p 2:38:35 } +2024-07-30 03:29:17,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2644/ 3125], loss: 0.282, per_step_time: 1416ms, lr: 8.425479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.64763 samples/s/p 2:38:54 } +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2646/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 8.422962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65803 samples/s/p 2:38:34 } +2024-07-30 03:29:23,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2648/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.420443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:23,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65900 samples/s/p 2:38:29 } +2024-07-30 03:29:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2650/ 3125], loss: 0.492, per_step_time: 1414ms, lr: 8.417922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65734 samples/s/p 2:38:29 } +2024-07-30 03:29:28,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2652/ 3125], loss: 0.169, per_step_time: 1416ms, lr: 8.4154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:28,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.64741 samples/s/p 2:38:43 } +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2654/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.412875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65802 samples/s/p 2:38:22 } +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2656/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 8.410349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.66151 samples/s/p 2:38:14 } +2024-07-30 03:29:37,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2658/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 8.407823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66043 samples/s/p 2:38:13 } +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2660/ 3125], loss: 0.666, per_step_time: 1413ms, lr: 8.405293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66042 samples/s/p 2:38:10 } +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2662/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 8.402762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65716 samples/s/p 2:38:13 } +2024-07-30 03:29:45,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2664/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 8.40023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65829 samples/s/p 2:38:08 } +2024-07-30 03:29:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2666/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 8.397697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65740 samples/s/p 2:38:07 } +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2668/ 3125], loss: 0.216, per_step_time: 1414ms, lr: 8.395162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65421 samples/s/p 2:38:09 } +2024-07-30 03:29:54,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2670/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.392624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:54,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65808 samples/s/p 2:38:00 } +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2672/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 8.390086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65984 samples/s/p 2:37:54 } +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2674/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.387545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66133 samples/s/p 2:37:49 } +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2676/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.385003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66145 samples/s/p 2:37:46 } +2024-07-30 03:30:05,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2678/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 8.38246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.65723 samples/s/p 2:37:50 } +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2680/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 8.379913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66226 samples/s/p 2:37:39 } +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2682/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 8.377367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66131 samples/s/p 2:37:37 } +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2684/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.374818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.65959 samples/s/p 2:37:37 } +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2686/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 8.372269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66170 samples/s/p 2:37:31 } +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2688/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 8.369716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65928 samples/s/p 2:37:32 } +2024-07-30 03:30:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2690/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.367164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:22,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66038 samples/s/p 2:37:28 } +2024-07-30 03:30:25,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2692/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.364609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:25,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65909 samples/s/p 2:37:27 } +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2694/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.3620525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66046 samples/s/p 2:37:22 } +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2696/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 8.359494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65955 samples/s/p 2:37:21 } +2024-07-30 03:30:34,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2698/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 8.356935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:34,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65833 samples/s/p 2:37:20 } +2024-07-30 03:30:36,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2700/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 8.354374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65984 samples/s/p 2:37:14 } +2024-07-30 03:30:39,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2702/ 3125], loss: 0.419, per_step_time: 1414ms, lr: 8.351811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65727 samples/s/p 2:37:16 } +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2704/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.349247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66052 samples/s/p 2:37:08 } +2024-07-30 03:30:45,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2706/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 8.34668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:45,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66177 samples/s/p 2:37:03 } +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2708/ 3125], loss: 0.245, per_step_time: 1418ms, lr: 8.344113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.63896 samples/s/p 2:37:38 } +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2710/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.3415425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66042 samples/s/p 2:36:59 } +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2712/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 8.338972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65715 samples/s/p 2:37:02 } +2024-07-30 03:30:56,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2714/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 8.336399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:56,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65988 samples/s/p 2:36:55 } +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2716/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 8.3338255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65480 samples/s/p 2:37:00 } +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2718/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.33125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65680 samples/s/p 2:36:54 } +2024-07-30 03:31:05,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2720/ 3125], loss: 0.154, per_step_time: 1415ms, lr: 8.328672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:05,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65055 samples/s/p 2:37:02 } +2024-07-30 03:31:08,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2722/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 8.326094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.66079 samples/s/p 2:36:42 } +2024-07-30 03:31:10,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2724/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.323513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:10,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66075 samples/s/p 2:36:39 } +2024-07-30 03:31:13,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2726/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 8.320931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:13,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66254 samples/s/p 2:36:33 } +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2728/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.318348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66047 samples/s/p 2:36:34 } +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2730/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.315763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66092 samples/s/p 2:36:30 } +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2732/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.313175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.65987 samples/s/p 2:36:29 } +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2734/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.310587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66304 samples/s/p 2:36:21 } +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2736/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.307998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65891 samples/s/p 2:36:25 } +2024-07-30 03:31:30,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2738/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 8.3054065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:30,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65836 samples/s/p 2:36:23 } +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2740/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 8.3028135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.64608 samples/s/p 2:36:41 } +2024-07-30 03:31:36,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2742/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.300218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:36,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65968 samples/s/p 2:36:15 } +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2744/ 3125], loss: 0.310, per_step_time: 1416ms, lr: 8.297622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.64576 samples/s/p 2:36:36 } +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2746/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.295025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65944 samples/s/p 2:36:10 } +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2748/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.292424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65912 samples/s/p 2:36:08 } +2024-07-30 03:31:47,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2750/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 8.289823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:47,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65688 samples/s/p 2:36:09 } +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2752/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.287221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:50,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65802 samples/s/p 2:36:04 } +2024-07-30 03:31:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2754/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.284617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:53,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66138 samples/s/p 2:35:56 } +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2756/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.282012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65821 samples/s/p 2:35:58 } +2024-07-30 03:31:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2758/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 8.279404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65993 samples/s/p 2:35:52 } +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2760/ 3125], loss: 0.341, per_step_time: 1412ms, lr: 8.276795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66259 samples/s/p 2:35:45 } +2024-07-30 03:32:04,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2762/ 3125], loss: 0.064, per_step_time: 1412ms, lr: 8.274184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66188 samples/s/p 2:35:43 } +2024-07-30 03:32:07,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2764/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 8.271573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:07,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65785 samples/s/p 2:35:47 } +2024-07-30 03:32:10,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2766/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.26896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:10,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66087 samples/s/p 2:35:39 } +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2768/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.266344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65566 samples/s/p 2:35:45 } +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2770/ 3125], loss: 0.292, per_step_time: 1417ms, lr: 8.263728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.64554 samples/s/p 2:35:59 } +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2772/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 8.2611095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65715 samples/s/p 2:35:37 } +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2774/ 3125], loss: 0.234, per_step_time: 1416ms, lr: 8.25849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.64744 samples/s/p 2:35:50 } +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2776/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 8.255868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65852 samples/s/p 2:35:29 } +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2778/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.253245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.66002 samples/s/p 2:35:24 } +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2780/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 8.250621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66109 samples/s/p 2:35:19 } +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2782/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 8.2479955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65949 samples/s/p 2:35:19 } +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2784/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 8.245368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66059 samples/s/p 2:35:14 } +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2786/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.242739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66011 samples/s/p 2:35:12 } +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2788/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 8.240108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65843 samples/s/p 2:35:12 } +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2790/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 8.237476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66219 samples/s/p 2:35:03 } +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2792/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 8.234842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65478 samples/s/p 2:35:13 } +2024-07-30 03:32:50,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2794/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 8.2322085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65857 samples/s/p 2:35:04 } +2024-07-30 03:32:52,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2796/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 8.22957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:52,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66300 samples/s/p 2:34:54 } +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2798/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 8.226932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66050 samples/s/p 2:34:55 } +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2800/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.224293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65906 samples/s/p 2:34:54 } +2024-07-30 03:32:58,651 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2802/ 3125], loss: 0.252, per_step_time: 1447ms, lr: 8.221651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.52677 samples/s/p 2:38:34 } +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2804/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.219007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65893 samples/s/p 2:34:49 } +2024-07-30 03:33:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2806/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.216363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:39,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.66108 samples/s/p 2:34:43 } +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2808/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.213718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65809 samples/s/p 2:34:45 } +2024-07-30 03:33:44,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2810/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 8.211069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:44,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.66121 samples/s/p 2:34:37 } +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2812/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 8.208421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65758 samples/s/p 2:34:40 } +2024-07-30 03:33:50,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2814/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 8.20577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:50,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.66097 samples/s/p 2:34:31 } +2024-07-30 03:33:53,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2816/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 8.203118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.65621 samples/s/p 2:34:36 } +2024-07-30 03:33:56,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2818/ 3125], loss: 0.163, per_step_time: 1416ms, lr: 8.200464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:56,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.64754 samples/s/p 2:34:48 } +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2820/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.19781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66173 samples/s/p 2:34:22 } +2024-07-30 03:34:02,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2822/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 8.195152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:02,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66085 samples/s/p 2:34:20 } +2024-07-30 03:34:04,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2824/ 3125], loss: 0.480, per_step_time: 1421ms, lr: 8.1924945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:04,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.62858 samples/s/p 2:35:11 } +2024-07-30 03:34:07,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2826/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 8.189835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:07,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66198 samples/s/p 2:34:13 } +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2828/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 8.187173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65925 samples/s/p 2:34:14 } +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2830/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.184512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65954 samples/s/p 2:34:11 } +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2832/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.181846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65996 samples/s/p 2:34:08 } +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2834/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 8.17918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65353 samples/s/p 2:34:15 } +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2836/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.176514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66162 samples/s/p 2:33:59 } +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2838/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 8.1738435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65857 samples/s/p 2:34:01 } +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2840/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.171173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66136 samples/s/p 2:33:54 } +2024-07-30 03:34:30,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2842/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.168502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:30,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65867 samples/s/p 2:33:56 } +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2844/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 8.165828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66038 samples/s/p 2:33:50 } +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2846/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 8.163152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65459 samples/s/p 2:33:57 } +2024-07-30 03:34:38,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2848/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 8.160477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:38,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65840 samples/s/p 2:33:48 } +2024-07-30 03:34:41,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2850/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.157799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65896 samples/s/p 2:33:44 } +2024-07-30 03:34:44,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2852/ 3125], loss: 0.294, per_step_time: 1425ms, lr: 8.155119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:44,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.61221 samples/s/p 2:34:58 } +2024-07-30 03:34:47,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2854/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.152439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:47,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.66124 samples/s/p 2:33:34 } +2024-07-30 03:34:50,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.149756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66120 samples/s/p 2:33:32 } +2024-07-30 03:34:53,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2858/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.147072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:53,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66035 samples/s/p 2:33:30 } +2024-07-30 03:34:55,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2860/ 3125], loss: 0.232, per_step_time: 1415ms, lr: 8.144387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:55,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65196 samples/s/p 2:33:41 } +2024-07-30 03:34:58,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2862/ 3125], loss: 0.199, per_step_time: 1415ms, lr: 8.1417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:58,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65122 samples/s/p 2:33:39 } +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2864/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.139012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65965 samples/s/p 2:33:23 } +2024-07-30 03:35:04,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2866/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 8.1363205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:04,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.65606 samples/s/p 2:33:26 } +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2868/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 8.133629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66028 samples/s/p 2:33:16 } +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2870/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.130936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66028 samples/s/p 2:33:13 } +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2872/ 3125], loss: 0.205, per_step_time: 1417ms, lr: 8.1282415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:13,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.64458 samples/s/p 2:33:36 } +2024-07-30 03:35:16,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2874/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.125546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66021 samples/s/p 2:33:08 } +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2876/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 8.122848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65873 samples/s/p 2:33:07 } +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2878/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.12015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65985 samples/s/p 2:33:03 } +2024-07-30 03:35:24,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2880/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.117449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:24,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66122 samples/s/p 2:32:58 } +2024-07-30 03:35:27,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2882/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 8.114746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65725 samples/s/p 2:33:01 } +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2884/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.112043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65875 samples/s/p 2:32:56 } +2024-07-30 03:35:33,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2886/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 8.109339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:33,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65206 samples/s/p 2:33:04 } +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2888/ 3125], loss: 0.190, per_step_time: 1417ms, lr: 8.106633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.64416 samples/s/p 2:33:14 } +2024-07-30 03:35:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2890/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 8.103924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65758 samples/s/p 2:32:49 } +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2892/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 8.101215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65623 samples/s/p 2:32:49 } +2024-07-30 03:35:44,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2894/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.098505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66028 samples/s/p 2:32:39 } +2024-07-30 03:35:47,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2896/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.0957925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:47,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65722 samples/s/p 2:32:42 } +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2898/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 8.0930795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65850 samples/s/p 2:32:37 } +2024-07-30 03:35:53,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2900/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.090362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:53,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66037 samples/s/p 2:32:31 } +2024-07-30 03:35:55,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2902/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.087645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:55,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65475 samples/s/p 2:32:37 } +2024-07-30 03:35:58,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2904/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 8.084929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:58,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65025 samples/s/p 2:32:42 } +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2906/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.082207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66165 samples/s/p 2:32:20 } +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2908/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.079487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65930 samples/s/p 2:32:21 } +2024-07-30 03:36:07,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2910/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.076764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:07,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66040 samples/s/p 2:32:17 } +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2912/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 8.07404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65936 samples/s/p 2:32:16 } +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2914/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.071315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65972 samples/s/p 2:32:12 } +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2916/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 8.068589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:15,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65958 samples/s/p 2:32:10 } +2024-07-30 03:36:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2918/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 8.065859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:18,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65910 samples/s/p 2:32:07 } +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2920/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.063129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66075 samples/s/p 2:32:02 } +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2922/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.060398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66043 samples/s/p 2:32:00 } +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2924/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.057666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65694 samples/s/p 2:32:02 } +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2926/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.05493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66024 samples/s/p 2:31:54 } +2024-07-30 03:36:32,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2928/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 8.052194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65752 samples/s/p 2:31:56 } +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2930/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.049457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65672 samples/s/p 2:31:54 } +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2932/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.046719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65937 samples/s/p 2:31:47 } +2024-07-30 03:36:41,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2934/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 8.043978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:41,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66053 samples/s/p 2:31:43 } +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2936/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 8.0412365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65946 samples/s/p 2:31:41 } +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2938/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.038493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65965 samples/s/p 2:31:38 } +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2940/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.035749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65470 samples/s/p 2:31:43 } +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2942/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 8.033003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65926 samples/s/p 2:31:33 } +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2944/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.030256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65980 samples/s/p 2:31:30 } +2024-07-30 03:36:58,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2946/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 8.027507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:58,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65879 samples/s/p 2:31:28 } +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2948/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.024756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:01,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65907 samples/s/p 2:31:25 } +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2950/ 3125], loss: 0.508, per_step_time: 1413ms, lr: 8.022005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65959 samples/s/p 2:31:21 } +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2952/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 8.019252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:06,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65010 samples/s/p 2:31:34 } +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2954/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.016496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66161 samples/s/p 2:31:13 } +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2956/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.013741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66071 samples/s/p 2:31:11 } +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2958/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.010983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:15,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65881 samples/s/p 2:31:11 } +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2960/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 8.008224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.66008 samples/s/p 2:31:07 } +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2962/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.005464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65884 samples/s/p 2:31:06 } +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2964/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.002702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65432 samples/s/p 2:31:10 } +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2966/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 7.999938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65981 samples/s/p 2:30:58 } +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2968/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.997174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65909 samples/s/p 2:30:57 } +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2970/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 7.9944075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65546 samples/s/p 2:31:00 } +2024-07-30 03:37:35,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2972/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 7.991641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:35,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65672 samples/s/p 2:30:55 } +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2974/ 3125], loss: 0.402, per_step_time: 1415ms, lr: 7.988871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65263 samples/s/p 2:30:59 } +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2976/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 7.986101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.66098 samples/s/p 2:30:42 } +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2978/ 3125], loss: 0.486, per_step_time: 1413ms, lr: 7.983329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65926 samples/s/p 2:30:42 } +2024-07-30 03:37:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2980/ 3125], loss: 0.218, per_step_time: 1414ms, lr: 7.980555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:46,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65627 samples/s/p 2:30:44 } +2024-07-30 03:37:49,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2982/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.977781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66059 samples/s/p 2:30:35 } +2024-07-30 03:37:52,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2984/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 7.975005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:52,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65916 samples/s/p 2:30:34 } +2024-07-30 03:37:55,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2986/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 7.972229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66144 samples/s/p 2:30:28 } +2024-07-30 03:37:57,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2988/ 3125], loss: 0.165, per_step_time: 1414ms, lr: 7.969448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65693 samples/s/p 2:30:32 } +2024-07-30 03:38:00,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2990/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.966668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66144 samples/s/p 2:30:22 } +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2992/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 7.963886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65285 samples/s/p 2:30:33 } +2024-07-30 03:38:06,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2994/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 7.961103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:06,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65608 samples/s/p 2:30:25 } +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2996/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 7.958318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.65905 samples/s/p 2:30:17 } +2024-07-30 03:38:12,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2998/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 7.955532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:12,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.66038 samples/s/p 2:30:12 } +2024-07-30 03:38:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3000/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.952744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:14,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65924 samples/s/p 2:30:11 } +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3002/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 7.949957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.66015 samples/s/p 2:30:07 } +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3004/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 7.9471665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65966 samples/s/p 2:30:05 } +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3006/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.9443735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66090 samples/s/p 2:30:00 } +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3008/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 7.94158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:26,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65871 samples/s/p 2:30:01 } +2024-07-30 03:38:29,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3010/ 3125], loss: 0.503, per_step_time: 1412ms, lr: 7.938786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:29,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66191 samples/s/p 2:29:53 } +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3012/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.93599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66011 samples/s/p 2:29:53 } +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3014/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 7.933193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65883 samples/s/p 2:29:52 } +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3016/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 7.9303945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65917 samples/s/p 2:29:49 } +2024-07-30 03:38:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3018/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 7.927595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.66048 samples/s/p 2:29:44 } +2024-07-30 03:38:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3020/ 3125], loss: 0.311, per_step_time: 1415ms, lr: 7.924794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:43,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65272 samples/s/p 2:29:53 } +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3022/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.92199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65842 samples/s/p 2:29:42 } +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3024/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.919186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.66008 samples/s/p 2:29:36 } +2024-07-30 03:38:51,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3026/ 3125], loss: 0.484, per_step_time: 1414ms, lr: 7.91638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:51,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65634 samples/s/p 2:29:39 } +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3028/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 7.9135725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65362 samples/s/p 2:29:41 } +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3030/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 7.910764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65780 samples/s/p 2:29:31 } +2024-07-30 03:39:00,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3032/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 7.907955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65626 samples/s/p 2:29:31 } +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3034/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 7.905143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65391 samples/s/p 2:29:32 } +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3036/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.902331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66139 samples/s/p 2:29:17 } +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3038/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.899518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66090 samples/s/p 2:29:15 } +2024-07-30 03:39:11,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3040/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.896702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:11,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66269 samples/s/p 2:29:09 } +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3042/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.893886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65863 samples/s/p 2:29:13 } +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3044/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 7.891067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:17,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66076 samples/s/p 2:29:07 } +2024-07-30 03:39:20,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3046/ 3125], loss: 0.483, per_step_time: 1412ms, lr: 7.888248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66255 samples/s/p 2:29:01 } +2024-07-30 03:39:22,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3048/ 3125], loss: 0.188, per_step_time: 1412ms, lr: 7.885426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:22,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66173 samples/s/p 2:29:00 } +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3050/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 7.882604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66157 samples/s/p 2:28:57 } +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3052/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 7.87978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66093 samples/s/p 2:28:55 } +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3054/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.876955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66030 samples/s/p 2:28:53 } +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3056/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 7.874129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66137 samples/s/p 2:28:49 } +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3058/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 7.871301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.65729 samples/s/p 2:28:52 } +2024-07-30 03:39:39,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3060/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 7.8684725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:39,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66196 samples/s/p 2:28:42 } +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3062/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.865641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66083 samples/s/p 2:28:41 } +2024-07-30 03:39:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3064/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.862808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:45,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65881 samples/s/p 2:28:42 } +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3066/ 3125], loss: 0.247, per_step_time: 1412ms, lr: 7.859976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66212 samples/s/p 2:28:33 } +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3068/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 7.857141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65656 samples/s/p 2:28:39 } +2024-07-30 03:39:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3070/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 7.854305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65283 samples/s/p 2:28:42 } +2024-07-30 03:39:56,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3072/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 7.851468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:56,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65939 samples/s/p 2:28:29 } +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3074/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.84863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65949 samples/s/p 2:28:26 } +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3076/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.845789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65933 samples/s/p 2:28:24 } +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3078/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.842948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65926 samples/s/p 2:28:21 } +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3080/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.840105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65916 samples/s/p 2:28:18 } +2024-07-30 03:40:11,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3082/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 7.8372605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65587 samples/s/p 2:28:21 } +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3084/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.834416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65678 samples/s/p 2:28:16 } +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3086/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.831569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66081 samples/s/p 2:28:07 } +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3088/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 7.82872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66196 samples/s/p 2:28:03 } +2024-07-30 03:40:22,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3090/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.825871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:22,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66002 samples/s/p 2:28:03 } +2024-07-30 03:40:25,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3092/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.82302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:25,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65924 samples/s/p 2:28:01 } +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3094/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.820167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65893 samples/s/p 2:27:59 } +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3096/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 7.817314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66019 samples/s/p 2:27:54 } +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3098/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.814459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65884 samples/s/p 2:27:53 } +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3100/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 7.811602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65968 samples/s/p 2:27:49 } +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3102/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.808745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65844 samples/s/p 2:27:48 } +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3104/ 3125], loss: 0.542, per_step_time: 1414ms, lr: 7.8058865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65502 samples/s/p 2:27:51 } +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3106/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 7.803026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:45,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66036 samples/s/p 2:27:40 } +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3108/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 7.800165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66036 samples/s/p 2:27:37 } +2024-07-30 03:40:50,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3110/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.797301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:50,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66058 samples/s/p 2:27:34 } +2024-07-30 03:40:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3112/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 7.794437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66112 samples/s/p 2:27:30 } +2024-07-30 03:40:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3114/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 7.791571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:56,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66000 samples/s/p 2:27:29 } +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3116/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 7.788703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66115 samples/s/p 2:27:24 } +2024-07-30 03:41:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3118/ 3125], loss: 0.107, per_step_time: 1414ms, lr: 7.785835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65607 samples/s/p 2:27:29 } +2024-07-30 03:41:04,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3120/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 7.782965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:04,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65743 samples/s/p 2:27:25 } +2024-07-30 03:41:07,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3122/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 7.780095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:07,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65902 samples/s/p 2:27:19 } +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3124/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.777224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65814 samples/s/p 2:27:18 } +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.774349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65773 samples/s/p 2:27:16 } +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 7.771474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65725 samples/s/p 2:27:13 } +2024-07-30 03:41:19,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 5/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 7.768598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:19,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65833 samples/s/p 2:27:09 } +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 7/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.7657205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65998 samples/s/p 2:27:04 } +2024-07-30 03:41:24,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 9/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.762842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:24,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65857 samples/s/p 2:27:03 } +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 11/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.759961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.65778 samples/s/p 2:27:01 } +2024-07-30 03:41:30,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 13/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.757079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:30,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66094 samples/s/p 2:26:54 } +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 15/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 7.754197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66107 samples/s/p 2:26:51 } +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 17/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 7.751312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66012 samples/s/p 2:26:49 } +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 19/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 7.748427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66144 samples/s/p 2:26:44 } +2024-07-30 03:41:41,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 21/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 7.74554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:41,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66009 samples/s/p 2:26:44 } +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 23/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.742651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65998 samples/s/p 2:26:41 } +2024-07-30 03:41:47,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 25/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 7.739762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:47,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66000 samples/s/p 2:26:38 } +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 27/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.736871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65829 samples/s/p 2:26:38 } +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 29/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.733979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66154 samples/s/p 2:26:30 } +2024-07-30 03:41:55,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 31/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.731086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65965 samples/s/p 2:26:30 } +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 33/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.728191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66015 samples/s/p 2:26:27 } +2024-07-30 03:42:01,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 35/ 3125], loss: 0.050, per_step_time: 1413ms, lr: 7.725296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:01,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66057 samples/s/p 2:26:23 } +2024-07-30 03:42:04,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 37/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 7.7223995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65913 samples/s/p 2:26:22 } +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 39/ 3125], loss: 0.476, per_step_time: 1413ms, lr: 7.7195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:07,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65779 samples/s/p 2:26:22 } +2024-07-30 03:42:10,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 41/ 3125], loss: 0.196, per_step_time: 1412ms, lr: 7.7166005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66210 samples/s/p 2:26:12 } +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 43/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 7.713699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65989 samples/s/p 2:26:13 } +2024-07-30 03:42:15,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 45/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.710796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:15,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65951 samples/s/p 2:26:11 } +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 47/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.707892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65599 samples/s/p 2:26:13 } +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 49/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 7.704987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65313 samples/s/p 2:26:15 } +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 51/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 7.702081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65348 samples/s/p 2:26:11 } +2024-07-30 03:42:27,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 53/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 7.699174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65659 samples/s/p 2:26:04 } +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 55/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.696265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65998 samples/s/p 2:25:56 } +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 57/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.693354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66134 samples/s/p 2:25:51 } +2024-07-30 03:42:35,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 59/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 7.6904425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:35,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.66042 samples/s/p 2:25:49 } +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 61/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 7.687529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.65926 samples/s/p 2:25:48 } +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 63/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 7.684615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65762 samples/s/p 2:25:48 } +2024-07-30 03:42:44,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 65/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 7.6817005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:44,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.66193 samples/s/p 2:25:39 } +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 67/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 7.678784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65830 samples/s/p 2:25:41 } +2024-07-30 03:42:49,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 69/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 7.675866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:49,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65821 samples/s/p 2:25:39 } +2024-07-30 03:42:52,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 71/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.6729475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65943 samples/s/p 2:25:34 } +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 73/ 3125], loss: 0.266, per_step_time: 1425ms, lr: 7.670027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.61281 samples/s/p 2:26:44 } +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 75/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.667105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.66085 samples/s/p 2:25:26 } +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 77/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.664182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65937 samples/s/p 2:25:26 } +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 79/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.661257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65951 samples/s/p 2:25:23 } +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 81/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.658331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66067 samples/s/p 2:25:18 } +2024-07-30 03:43:09,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 83/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.655404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:09,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66048 samples/s/p 2:25:15 } +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 85/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 7.652477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66251 samples/s/p 2:25:09 } +2024-07-30 03:43:15,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 87/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.649548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65843 samples/s/p 2:25:13 } +2024-07-30 03:43:18,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 89/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 7.646618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:18,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66304 samples/s/p 2:25:03 } +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 91/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.643685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65902 samples/s/p 2:25:06 } +2024-07-30 03:43:23,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 93/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 7.640752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65950 samples/s/p 2:25:03 } +2024-07-30 03:43:26,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 95/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 7.637817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66134 samples/s/p 2:24:57 } +2024-07-30 03:43:29,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 97/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6348815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:29,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.66090 samples/s/p 2:24:55 } +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 99/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 7.631944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65653 samples/s/p 2:24:59 } +2024-07-30 03:43:35,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 101/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 7.629007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:35,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65814 samples/s/p 2:24:54 } +2024-07-30 03:43:37,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 103/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 7.626067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65732 samples/s/p 2:24:52 } +2024-07-30 03:43:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 105/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 7.6231267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:40,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65746 samples/s/p 2:24:49 } +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 107/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.6201854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65684 samples/s/p 2:24:47 } +2024-07-30 03:43:46,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 109/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6172423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65974 samples/s/p 2:24:40 } +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 111/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 7.614297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65853 samples/s/p 2:24:39 } +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 113/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.6113506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.66162 samples/s/p 2:24:31 } +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 115/ 3125], loss: 0.049, per_step_time: 1412ms, lr: 7.608404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66245 samples/s/p 2:24:27 } +2024-07-30 03:43:57,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 117/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 7.6054557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65836 samples/s/p 2:24:31 } +2024-07-30 03:44:00,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 119/ 3125], loss: 0.228, per_step_time: 1425ms, lr: 7.6025067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:00,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.61289 samples/s/p 2:25:38 } +2024-07-30 03:44:03,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 121/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.5995563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:03,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66091 samples/s/p 2:24:21 } +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 123/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.5966045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:06,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65820 samples/s/p 2:24:22 } +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 125/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 7.5936505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65894 samples/s/p 2:24:18 } +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 127/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 7.5906964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65589 samples/s/p 2:24:20 } +2024-07-30 03:44:14,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 129/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.5877415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:14,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65773 samples/s/p 2:24:15 } +2024-07-30 03:44:17,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 131/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.5847843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:17,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65994 samples/s/p 2:24:08 } +2024-07-30 03:44:20,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 133/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.5818257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:20,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65749 samples/s/p 2:24:09 } +2024-07-30 03:44:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 135/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.578866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65687 samples/s/p 2:24:07 } +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 137/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 7.5759062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65836 samples/s/p 2:24:02 } +2024-07-30 03:44:29,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 139/ 3125], loss: 0.216, per_step_time: 1415ms, lr: 7.5729445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:29,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65236 samples/s/p 2:24:09 } +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 141/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 7.569982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.66199 samples/s/p 2:23:51 } +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 143/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 7.567018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65747 samples/s/p 2:23:55 } +2024-07-30 03:44:37,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 145/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 7.5640514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:37,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66283 samples/s/p 2:23:44 } +2024-07-30 03:44:40,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 147/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.5610837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:40,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65907 samples/s/p 2:23:47 } +2024-07-30 03:44:43,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 149/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.5581165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:43,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66126 samples/s/p 2:23:41 } +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 151/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.555147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66168 samples/s/p 2:23:37 } +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 153/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 7.5521775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65905 samples/s/p 2:23:39 } +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 155/ 3125], loss: 0.485, per_step_time: 1412ms, lr: 7.5492057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66208 samples/s/p 2:23:31 } +2024-07-30 03:44:54,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 157/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 7.5462335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:54,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65982 samples/s/p 2:23:32 } +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 159/ 3125], loss: 0.145, per_step_time: 1412ms, lr: 7.5432595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66263 samples/s/p 2:23:25 } +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 161/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 7.5402836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66248 samples/s/p 2:23:22 } +2024-07-30 03:45:03,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 163/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 7.5373077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:03,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65872 samples/s/p 2:23:25 } +2024-07-30 03:45:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 165/ 3125], loss: 0.220, per_step_time: 1419ms, lr: 7.5343296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:05,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.63722 samples/s/p 2:23:55 } +2024-07-30 03:45:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 167/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 7.5313505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:08,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65702 samples/s/p 2:23:22 } +2024-07-30 03:45:11,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 169/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 7.5283706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66131 samples/s/p 2:23:13 } +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 171/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 7.525389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66049 samples/s/p 2:23:11 } +2024-07-30 03:45:17,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 173/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.522407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:17,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65802 samples/s/p 2:23:12 } +2024-07-30 03:45:20,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 175/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.519424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:20,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65805 samples/s/p 2:23:09 } +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 177/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 7.516439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66069 samples/s/p 2:23:02 } +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 179/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 7.5134526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66087 samples/s/p 2:22:59 } +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 181/ 3125], loss: 0.536, per_step_time: 1414ms, lr: 7.5104654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65431 samples/s/p 2:23:06 } +2024-07-30 03:45:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 183/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.5074754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65909 samples/s/p 2:22:56 } +2024-07-30 03:45:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 185/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.5044863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.66082 samples/s/p 2:22:51 } +2024-07-30 03:45:37,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 187/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.501496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:37,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65528 samples/s/p 2:22:56 } +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 189/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 7.4985037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65890 samples/s/p 2:22:48 } +2024-07-30 03:45:42,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 191/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 7.495511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:42,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65787 samples/s/p 2:22:47 } +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 193/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.4925165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65925 samples/s/p 2:22:42 } +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 195/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 7.4895215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65708 samples/s/p 2:22:42 } +2024-07-30 03:45:51,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 197/ 3125], loss: 0.272, per_step_time: 1417ms, lr: 7.4865234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:51,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.64469 samples/s/p 2:22:58 } +2024-07-30 03:45:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 199/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 7.4835257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65511 samples/s/p 2:22:40 } +2024-07-30 03:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 201/ 3125], loss: 0.027, per_step_time: 1414ms, lr: 7.4805257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65754 samples/s/p 2:22:33 } +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 203/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.4775253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65991 samples/s/p 2:22:27 } +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 205/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 7.4745244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65698 samples/s/p 2:22:28 } +2024-07-30 03:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 207/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.4715217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65983 samples/s/p 2:22:21 } +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 209/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 7.4685177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66111 samples/s/p 2:22:16 } +2024-07-30 03:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 211/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.465513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65949 samples/s/p 2:22:16 } +2024-07-30 03:46:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 213/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.462506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65926 samples/s/p 2:22:13 } +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 215/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 7.4594986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66110 samples/s/p 2:22:08 } +2024-07-30 03:46:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 217/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.45649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:19,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65976 samples/s/p 2:22:07 } +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 219/ 3125], loss: 0.121, per_step_time: 1412ms, lr: 7.4534796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66176 samples/s/p 2:22:01 } +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 221/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.4504687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66172 samples/s/p 2:21:58 } +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 223/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 7.447457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66062 samples/s/p 2:21:57 } +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 225/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 7.4444433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66218 samples/s/p 2:21:52 } +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 227/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.4414297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65899 samples/s/p 2:21:54 } +2024-07-30 03:46:36,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 229/ 3125], loss: 0.117, per_step_time: 1412ms, lr: 7.438414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66185 samples/s/p 2:21:47 } +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 231/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.4353975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65887 samples/s/p 2:21:49 } +2024-07-30 03:46:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 233/ 3125], loss: 0.202, per_step_time: 1416ms, lr: 7.432379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.64822 samples/s/p 2:22:02 } +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 235/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.429359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65869 samples/s/p 2:21:43 } +2024-07-30 03:46:47,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 237/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 7.4263385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66000 samples/s/p 2:21:38 } +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 239/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65988 samples/s/p 2:21:36 } +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 241/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.4202953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66133 samples/s/p 2:21:31 } +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 243/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.4172717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65777 samples/s/p 2:21:33 } +2024-07-30 03:46:59,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 245/ 3125], loss: 0.160, per_step_time: 1416ms, lr: 7.4142467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:59,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.64760 samples/s/p 2:21:46 } +2024-07-30 03:47:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 247/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 7.4112213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:02,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65364 samples/s/p 2:21:34 } +2024-07-30 03:47:04,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 249/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 7.408193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:04,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65973 samples/s/p 2:21:22 } +2024-07-30 03:47:07,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 251/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 7.4051645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.66086 samples/s/p 2:21:17 } +2024-07-30 03:47:10,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 253/ 3125], loss: 0.345, per_step_time: 1415ms, lr: 7.4021355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.65344 samples/s/p 2:21:26 } +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 255/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.399104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65818 samples/s/p 2:21:16 } +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 257/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.396072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65753 samples/s/p 2:21:14 } +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 259/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 7.393039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65204 samples/s/p 2:21:19 } +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 261/ 3125], loss: 0.369, per_step_time: 1414ms, lr: 7.3900055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65764 samples/s/p 2:21:08 } +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 263/ 3125], loss: 0.533, per_step_time: 1414ms, lr: 7.3869705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65664 samples/s/p 2:21:07 } +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 265/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 7.383934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:27,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66085 samples/s/p 2:20:58 } +2024-07-30 03:47:30,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 267/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.380896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:30,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65871 samples/s/p 2:20:58 } +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 269/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 7.377857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65995 samples/s/p 2:20:53 } +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 271/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 7.374817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65947 samples/s/p 2:20:51 } +2024-07-30 03:47:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 273/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.371776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65846 samples/s/p 2:20:50 } +2024-07-30 03:47:41,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 275/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 7.3687343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:41,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65731 samples/s/p 2:20:49 } +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 277/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.3656915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.66131 samples/s/p 2:20:40 } +2024-07-30 03:47:47,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 279/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.3626475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:47,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65718 samples/s/p 2:20:43 } +2024-07-30 03:47:50,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 281/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.3596025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:50,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65694 samples/s/p 2:20:41 } +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 283/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.3565557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65844 samples/s/p 2:20:36 } +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 285/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.353507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66156 samples/s/p 2:20:28 } +2024-07-30 03:47:58,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 287/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 7.350459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65793 samples/s/p 2:20:31 } +2024-07-30 03:48:01,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 289/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.347408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:01,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65918 samples/s/p 2:20:26 } +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 291/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.344357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66056 samples/s/p 2:20:21 } +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 293/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 7.341305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65770 samples/s/p 2:20:23 } +2024-07-30 03:48:10,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 295/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.338252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:10,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65928 samples/s/p 2:20:18 } +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 297/ 3125], loss: 0.263, per_step_time: 1412ms, lr: 7.3351976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66207 samples/s/p 2:20:11 } +2024-07-30 03:48:15,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 299/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 7.3321426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66185 samples/s/p 2:20:08 } +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 301/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.329085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:18,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65810 samples/s/p 2:20:11 } +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 303/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 7.3260276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:21,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65981 samples/s/p 2:20:05 } +2024-07-30 03:48:24,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 305/ 3125], loss: 0.338, per_step_time: 1425ms, lr: 7.3229676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:24,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.61354 samples/s/p 2:21:12 } +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 307/ 3125], loss: 0.191, per_step_time: 1415ms, lr: 7.319908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65275 samples/s/p 2:20:10 } +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 309/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.3168467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.66085 samples/s/p 2:19:55 } +2024-07-30 03:48:32,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 311/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 7.313785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:32,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65790 samples/s/p 2:19:57 } +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 313/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 7.3107217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66043 samples/s/p 2:19:50 } +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 315/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.307658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66036 samples/s/p 2:19:48 } +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 317/ 3125], loss: 0.287, per_step_time: 1415ms, lr: 7.3045926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65213 samples/s/p 2:19:57 } +2024-07-30 03:48:44,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 319/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 7.301526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:44,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66113 samples/s/p 2:19:41 } +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 321/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.2984576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65442 samples/s/p 2:19:48 } +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 323/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.2953876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66054 samples/s/p 2:19:36 } +2024-07-30 03:48:52,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 325/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 7.292318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:52,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66086 samples/s/p 2:19:33 } +2024-07-30 03:48:55,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 327/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.289247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:55,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66014 samples/s/p 2:19:31 } +2024-07-30 03:48:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 329/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 7.2861753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65476 samples/s/p 2:19:36 } +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 331/ 3125], loss: 0.421, per_step_time: 1412ms, lr: 7.2831026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66179 samples/s/p 2:19:23 } +2024-07-30 03:49:04,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 333/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 7.280029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:04,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66126 samples/s/p 2:19:21 } +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 335/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 7.2769526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66327 samples/s/p 2:19:15 } +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 337/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.2738767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65792 samples/s/p 2:19:20 } +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 339/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 7.270799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65892 samples/s/p 2:19:16 } +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 341/ 3125], loss: 0.279, per_step_time: 1415ms, lr: 7.2677194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65150 samples/s/p 2:19:24 } +2024-07-30 03:49:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 343/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.2646403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:18,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65987 samples/s/p 2:19:09 } +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 345/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.2615594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65656 samples/s/p 2:19:11 } +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 347/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.2584776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65673 samples/s/p 2:19:08 } +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 349/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.255395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65922 samples/s/p 2:19:01 } +2024-07-30 03:49:29,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 351/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.2523117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:29,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66121 samples/s/p 2:18:56 } +2024-07-30 03:49:32,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 353/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.249226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65806 samples/s/p 2:18:57 } +2024-07-30 03:49:35,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 355/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.2461407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:35,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65914 samples/s/p 2:18:53 } +2024-07-30 03:49:38,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 357/ 3125], loss: 0.162, per_step_time: 1415ms, lr: 7.2430526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:38,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65351 samples/s/p 2:18:58 } +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 359/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.2399635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65856 samples/s/p 2:18:48 } +2024-07-30 03:49:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 361/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.236874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:43,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65487 samples/s/p 2:18:51 } +2024-07-30 03:49:46,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 363/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.233784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66140 samples/s/p 2:18:38 } +2024-07-30 03:49:49,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 365/ 3125], loss: 0.235, per_step_time: 1412ms, lr: 7.230693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:49,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66213 samples/s/p 2:18:34 } +2024-07-30 03:49:52,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 367/ 3125], loss: 0.042, per_step_time: 1413ms, lr: 7.2276007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66079 samples/s/p 2:18:34 } +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 369/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.224507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66024 samples/s/p 2:18:32 } +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 371/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.221411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66019 samples/s/p 2:18:29 } +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 373/ 3125], loss: 0.220, per_step_time: 1418ms, lr: 7.218316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.63973 samples/s/p 2:18:56 } +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 375/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.215219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.65879 samples/s/p 2:18:25 } +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 377/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 7.21212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65149 samples/s/p 2:18:33 } +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 379/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.209022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66063 samples/s/p 2:18:17 } +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 381/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.205922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66212 samples/s/p 2:18:12 } +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 383/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.202821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66015 samples/s/p 2:18:12 } +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 385/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 7.199719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65536 samples/s/p 2:18:16 } +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 387/ 3125], loss: 0.111, per_step_time: 1414ms, lr: 7.1966165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65726 samples/s/p 2:18:10 } +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 389/ 3125], loss: 0.102, per_step_time: 1415ms, lr: 7.193513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65051 samples/s/p 2:18:18 } +2024-07-30 03:50:26,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 391/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 7.190406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:26,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65890 samples/s/p 2:18:02 } +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 393/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.1872996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66027 samples/s/p 2:17:58 } +2024-07-30 03:50:31,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 395/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.184192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:31,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66125 samples/s/p 2:17:53 } +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 397/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 7.181084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65909 samples/s/p 2:17:54 } +2024-07-30 03:50:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 399/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.177975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66070 samples/s/p 2:17:48 } +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 401/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.174864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66235 samples/s/p 2:17:43 } +2024-07-30 03:50:43,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 403/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.1717536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:43,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65863 samples/s/p 2:17:46 } +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 405/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.168641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66025 samples/s/p 2:17:41 } +2024-07-30 03:50:48,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 407/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 7.1655268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:48,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65800 samples/s/p 2:17:41 } +2024-07-30 03:50:51,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 409/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.162412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:51,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65953 samples/s/p 2:17:36 } +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 411/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.1592967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66160 samples/s/p 2:17:30 } +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 413/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.1561794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66008 samples/s/p 2:17:30 } +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 415/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 7.1530612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:00,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66235 samples/s/p 2:17:23 } +2024-07-30 03:51:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 417/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 7.149943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:03,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66125 samples/s/p 2:17:22 } +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 419/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 7.146824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65813 samples/s/p 2:17:24 } +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 421/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 7.1437034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66171 samples/s/p 2:17:16 } +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 423/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 7.1405816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65891 samples/s/p 2:17:17 } +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 425/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.137458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.66091 samples/s/p 2:17:11 } +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 427/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.1343343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65872 samples/s/p 2:17:12 } +2024-07-30 03:51:20,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 429/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 7.131209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:20,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65909 samples/s/p 2:17:08 } +2024-07-30 03:51:22,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 431/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 7.128083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:22,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65696 samples/s/p 2:17:09 } +2024-07-30 03:51:25,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 433/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 7.1249565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:25,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65757 samples/s/p 2:17:05 } +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 435/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 7.1218287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65535 samples/s/p 2:17:05 } +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 437/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.1187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65387 samples/s/p 2:17:05 } +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 439/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.11557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65696 samples/s/p 2:16:57 } +2024-07-30 03:51:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 441/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.1124396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:37,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65635 samples/s/p 2:16:55 } +2024-07-30 03:51:39,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 443/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 7.109307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:39,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66062 samples/s/p 2:16:46 } +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 445/ 3125], loss: 0.195, per_step_time: 1412ms, lr: 7.106174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66238 samples/s/p 2:16:41 } +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 447/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.103039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65912 samples/s/p 2:16:43 } +2024-07-30 03:51:48,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 449/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.0999045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:48,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65844 samples/s/p 2:16:41 } +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 451/ 3125], loss: 0.402, per_step_time: 1412ms, lr: 7.0967685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66203 samples/s/p 2:16:33 } +2024-07-30 03:51:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 453/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 7.093632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.65631 samples/s/p 2:16:38 } +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 455/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.0904944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66061 samples/s/p 2:16:29 } +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 457/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 7.0873557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66286 samples/s/p 2:16:23 } +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 459/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.0842143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.65969 samples/s/p 2:16:25 } +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 461/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.081074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66110 samples/s/p 2:16:20 } +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 463/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.077932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66090 samples/s/p 2:16:18 } +2024-07-30 03:52:11,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 465/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.0747888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:11,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66101 samples/s/p 2:16:15 } +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 467/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.071645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65833 samples/s/p 2:16:16 } +2024-07-30 03:52:16,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 469/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 7.0685005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:16,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65987 samples/s/p 2:16:11 } +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 471/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.0653537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65978 samples/s/p 2:16:08 } +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 473/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.0622073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65952 samples/s/p 2:16:06 } +2024-07-30 03:52:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 475/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 7.0590595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:25,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65830 samples/s/p 2:16:04 } +2024-07-30 03:52:28,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 477/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.055911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:28,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65936 samples/s/p 2:16:00 } +2024-07-30 03:52:30,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 479/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 7.0527603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:30,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65269 samples/s/p 2:16:07 } +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 481/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 7.0496094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.65832 samples/s/p 2:15:56 } +2024-07-30 03:52:36,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 483/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.046458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66057 samples/s/p 2:15:50 } +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 485/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 7.043305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66060 samples/s/p 2:15:47 } +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 487/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.040151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:42,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66023 samples/s/p 2:15:45 } +2024-07-30 03:52:45,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 489/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.036997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:45,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66073 samples/s/p 2:15:41 } +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 491/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.033841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.65979 samples/s/p 2:15:40 } +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 493/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.0306837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66086 samples/s/p 2:15:35 } +2024-07-30 03:52:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 495/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.0275264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66160 samples/s/p 2:15:31 } +2024-07-30 03:52:56,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 497/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 7.0243677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:56,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66134 samples/s/p 2:15:29 } +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 499/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.0212086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66097 samples/s/p 2:15:27 } +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 501/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 7.018047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65959 samples/s/p 2:15:26 } +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 503/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 7.014886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65593 samples/s/p 2:15:28 } +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 505/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.0117235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65914 samples/s/p 2:15:21 } +2024-07-30 03:53:10,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 507/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 7.0085603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:10,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66186 samples/s/p 2:15:14 } +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 509/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 7.0053957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65479 samples/s/p 2:15:21 } +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 511/ 3125], loss: 0.140, per_step_time: 1414ms, lr: 7.0022306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65501 samples/s/p 2:15:18 } +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 513/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 6.9990638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65743 samples/s/p 2:15:12 } +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 515/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 6.9958965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66180 samples/s/p 2:15:03 } +2024-07-30 03:53:24,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 517/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 6.9927287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:24,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66017 samples/s/p 2:15:02 } +2024-07-30 03:53:27,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 519/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 6.9895596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:27,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66086 samples/s/p 2:14:59 } +2024-07-30 03:53:30,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 521/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.9863895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:30,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.65965 samples/s/p 2:14:58 } +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 523/ 3125], loss: 0.258, per_step_time: 1420ms, lr: 6.983218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.63024 samples/s/p 2:15:37 } +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 525/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.980046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.65930 samples/s/p 2:14:52 } +2024-07-30 03:53:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 527/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.976873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.66010 samples/s/p 2:14:48 } +2024-07-30 03:53:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 529/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 6.9736993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65882 samples/s/p 2:14:47 } +2024-07-30 03:53:44,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 531/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 6.9705247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65901 samples/s/p 2:14:44 } +2024-07-30 03:53:47,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 533/ 3125], loss: 0.182, per_step_time: 1414ms, lr: 6.967349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:47,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65764 samples/s/p 2:14:43 } +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 535/ 3125], loss: 0.098, per_step_time: 1415ms, lr: 6.964172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65362 samples/s/p 2:14:46 } +2024-07-30 03:53:53,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 537/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 6.9609937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:53,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65826 samples/s/p 2:14:37 } +2024-07-30 03:53:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 539/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.957816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:55,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65956 samples/s/p 2:14:32 } +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 541/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 6.9546363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65890 samples/s/p 2:14:30 } +2024-07-30 03:54:01,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 543/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.9514554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:01,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65986 samples/s/p 2:14:26 } +2024-07-30 03:54:04,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 545/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.9482744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:04,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65970 samples/s/p 2:14:24 } +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 547/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 6.945091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.65981 samples/s/p 2:14:21 } +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 549/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9419084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66105 samples/s/p 2:14:16 } +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 551/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 6.9387243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66195 samples/s/p 2:14:12 } +2024-07-30 03:54:15,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 553/ 3125], loss: 0.216, per_step_time: 1418ms, lr: 6.935539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.64146 samples/s/p 2:14:38 } +2024-07-30 03:54:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 555/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 6.9323532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66142 samples/s/p 2:14:07 } +2024-07-30 03:54:21,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 557/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 6.929166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:21,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65767 samples/s/p 2:14:09 } +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 559/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 6.9259777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65987 samples/s/p 2:14:04 } +2024-07-30 03:54:27,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 561/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 6.9227895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:27,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66037 samples/s/p 2:14:00 } +2024-07-30 03:54:29,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 563/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.9195994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:29,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65906 samples/s/p 2:13:59 } +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 565/ 3125], loss: 0.587, per_step_time: 1412ms, lr: 6.916409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.66172 samples/s/p 2:13:52 } +2024-07-30 03:54:35,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 567/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.913218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65782 samples/s/p 2:13:55 } +2024-07-30 03:54:38,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 569/ 3125], loss: 0.142, per_step_time: 1414ms, lr: 6.9100247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:38,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65742 samples/s/p 2:13:53 } +2024-07-30 03:54:41,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 571/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 6.9068315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:41,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65928 samples/s/p 2:13:47 } +2024-07-30 03:54:44,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 573/ 3125], loss: 0.064, per_step_time: 1417ms, lr: 6.9036373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:44,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.64547 samples/s/p 2:14:04 } +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 575/ 3125], loss: 0.199, per_step_time: 1412ms, lr: 6.9004423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66192 samples/s/p 2:13:38 } +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 577/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 6.8972463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.65865 samples/s/p 2:13:40 } +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 579/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 6.894049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66110 samples/s/p 2:13:33 } +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 581/ 3125], loss: 0.071, per_step_time: 1413ms, lr: 6.8908503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66106 samples/s/p 2:13:31 } +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 583/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 6.887652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65335 samples/s/p 2:13:39 } +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 585/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 6.8844524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65768 samples/s/p 2:13:30 } +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 587/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.881252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66126 samples/s/p 2:13:22 } +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 589/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 6.8780505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65759 samples/s/p 2:13:24 } +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 591/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.8748477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65955 samples/s/p 2:13:19 } +2024-07-30 03:55:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 593/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.8716445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:12,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.66041 samples/s/p 2:13:15 } +2024-07-30 03:55:15,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 595/ 3125], loss: 0.161, per_step_time: 1418ms, lr: 6.8684403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:15,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.64091 samples/s/p 2:13:39 } +2024-07-30 03:55:18,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 597/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 6.8652353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:18,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65459 samples/s/p 2:13:17 } +2024-07-30 03:55:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 599/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 6.8620293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:21,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.66030 samples/s/p 2:13:06 } +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 601/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.858822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65696 samples/s/p 2:13:08 } +2024-07-30 03:55:26,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 603/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 6.855614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65842 samples/s/p 2:13:03 } +2024-07-30 03:55:29,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 605/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 6.852406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.66017 samples/s/p 2:12:58 } +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 607/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 6.8491963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65901 samples/s/p 2:12:57 } +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 609/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.8459854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65704 samples/s/p 2:12:57 } +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 611/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 6.8427744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65692 samples/s/p 2:12:54 } +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 613/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.8395625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65949 samples/s/p 2:12:48 } +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 615/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 6.836349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65902 samples/s/p 2:12:46 } +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 617/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.833135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66022 samples/s/p 2:12:41 } +2024-07-30 03:55:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 619/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 6.829921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66064 samples/s/p 2:12:38 } +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 621/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 6.826705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66065 samples/s/p 2:12:35 } +2024-07-30 03:55:55,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 623/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.823488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:55,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66046 samples/s/p 2:12:32 } +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 625/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 6.8202708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.66028 samples/s/p 2:12:30 } +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 627/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 6.817053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65823 samples/s/p 2:12:30 } +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 629/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.8138334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65924 samples/s/p 2:12:25 } +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 631/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.8106133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65810 samples/s/p 2:12:24 } +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 633/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 6.8073928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65703 samples/s/p 2:12:23 } +2024-07-30 03:56:12,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 635/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 6.804171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:12,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65408 samples/s/p 2:12:24 } +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 637/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.8009476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65860 samples/s/p 2:12:15 } +2024-07-30 03:56:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 639/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 6.7977244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:17,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65809 samples/s/p 2:12:13 } +2024-07-30 03:56:20,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 641/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 6.7945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:20,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66121 samples/s/p 2:12:06 } +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 643/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.7912756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66064 samples/s/p 2:12:04 } +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 645/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 6.788049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.65967 samples/s/p 2:12:02 } +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 647/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.7848214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.65916 samples/s/p 2:12:00 } +2024-07-30 03:56:31,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 649/ 3125], loss: 0.085, per_step_time: 1417ms, lr: 6.7815945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:31,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.64263 samples/s/p 2:12:20 } +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 651/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.7783653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65796 samples/s/p 2:11:56 } +2024-07-30 03:56:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 653/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 6.7751357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:37,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65977 samples/s/p 2:11:51 } +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 655/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.7719066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66105 samples/s/p 2:11:46 } +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 657/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 6.768675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66093 samples/s/p 2:11:43 } +2024-07-30 03:56:46,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 659/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 6.7654423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65978 samples/s/p 2:11:42 } +2024-07-30 03:56:48,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 661/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.76221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:48,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66033 samples/s/p 2:11:39 } +2024-07-30 03:56:51,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 663/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 6.7589763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:51,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65873 samples/s/p 2:11:38 } +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 665/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 6.7557417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66070 samples/s/p 2:11:33 } +2024-07-30 03:56:57,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 667/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 6.752506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65987 samples/s/p 2:11:31 } +2024-07-30 03:57:00,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 669/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.7492706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:00,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65980 samples/s/p 2:11:28 } +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 671/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.7460333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66038 samples/s/p 2:11:24 } +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 673/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 6.742795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66210 samples/s/p 2:11:19 } +2024-07-30 03:57:08,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 675/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 6.7395567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:08,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65804 samples/s/p 2:11:22 } +2024-07-30 03:57:11,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 677/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 6.736317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:11,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65763 samples/s/p 2:11:20 } +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 679/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 6.733077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:14,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65406 samples/s/p 2:11:22 } +2024-07-30 03:57:17,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 681/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 6.7298356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:17,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65917 samples/s/p 2:11:12 } +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 683/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.7265933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65624 samples/s/p 2:11:13 } +2024-07-30 03:57:22,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 685/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 6.723351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:22,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.66007 samples/s/p 2:11:05 } +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 687/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 6.7201063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65901 samples/s/p 2:11:04 } +2024-07-30 03:57:28,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 689/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.7168626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65985 samples/s/p 2:11:00 } +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 691/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.7136175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.66064 samples/s/p 2:10:56 } +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 693/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 6.710371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65519 samples/s/p 2:11:01 } +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 695/ 3125], loss: 0.328, per_step_time: 1417ms, lr: 6.707124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.64489 samples/s/p 2:11:12 } +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 697/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.703876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65978 samples/s/p 2:10:49 } +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 699/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 6.700628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65730 samples/s/p 2:10:49 } +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 701/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.6973794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.66107 samples/s/p 2:10:41 } +2024-07-30 03:57:48,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 703/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 6.6941284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:48,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65655 samples/s/p 2:10:45 } +2024-07-30 03:57:51,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 705/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.690877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:51,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.65941 samples/s/p 2:10:38 } +2024-07-30 03:57:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 707/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.6876255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66119 samples/s/p 2:10:32 } +2024-07-30 03:57:56,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 709/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 6.6843727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:56,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66161 samples/s/p 2:10:29 } +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 711/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 6.681119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66016 samples/s/p 2:10:28 } +2024-07-30 03:58:02,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 713/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.6778657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:02,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66029 samples/s/p 2:10:25 } +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 715/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.67461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66203 samples/s/p 2:10:20 } +2024-07-30 03:58:08,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 717/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 6.671354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:08,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66255 samples/s/p 2:10:16 } +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 719/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.6680977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65995 samples/s/p 2:10:17 } +2024-07-30 03:58:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 721/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.6648404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65934 samples/s/p 2:10:15 } +2024-07-30 03:58:16,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 723/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 6.6615817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65808 samples/s/p 2:10:14 } +2024-07-30 03:58:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 725/ 3125], loss: 0.420, per_step_time: 1416ms, lr: 6.6583234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:19,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.64800 samples/s/p 2:10:25 } +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 727/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.6550633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.65596 samples/s/p 2:10:11 } +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 729/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.6518032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66088 samples/s/p 2:10:02 } +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 731/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 6.648541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66211 samples/s/p 2:09:57 } +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 733/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 6.6452794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66079 samples/s/p 2:09:56 } +2024-07-30 03:58:33,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 735/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 6.6420166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:33,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66166 samples/s/p 2:09:52 } +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 737/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 6.6387524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65580 samples/s/p 2:09:58 } +2024-07-30 03:58:39,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 739/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 6.6354874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65642 samples/s/p 2:09:54 } +2024-07-30 03:58:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 741/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 6.632223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65785 samples/s/p 2:09:49 } +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 743/ 3125], loss: 0.356, per_step_time: 1414ms, lr: 6.6289567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65741 samples/s/p 2:09:47 } +2024-07-30 03:58:47,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 745/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 6.62569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:47,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66068 samples/s/p 2:09:39 } +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 747/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 6.622422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65879 samples/s/p 2:09:39 } +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 749/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 6.6191533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:53,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66011 samples/s/p 2:09:35 } +2024-07-30 03:58:56,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 751/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 6.6158846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66158 samples/s/p 2:09:30 } +2024-07-30 03:58:59,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 753/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 6.612614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66106 samples/s/p 2:09:28 } +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 755/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 6.6093444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66044 samples/s/p 2:09:26 } +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 757/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 6.6060725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66127 samples/s/p 2:09:22 } +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 759/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 6.6028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66154 samples/s/p 2:09:19 } +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 761/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 6.599527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66164 samples/s/p 2:09:16 } +2024-07-30 03:59:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 763/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 6.5962536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:13,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65964 samples/s/p 2:09:15 } +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 765/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 6.5929794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66173 samples/s/p 2:09:10 } +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 767/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.5897034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65914 samples/s/p 2:09:11 } +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 769/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 6.5864274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65753 samples/s/p 2:09:10 } +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 771/ 3125], loss: 0.358, per_step_time: 1415ms, lr: 6.5831505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65298 samples/s/p 2:09:13 } +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 773/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 6.5798736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65937 samples/s/p 2:09:02 } +2024-07-30 03:59:30,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 775/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 6.5765944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:30,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.66136 samples/s/p 2:08:56 } +2024-07-30 03:59:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 777/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 6.5733157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:33,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65857 samples/s/p 2:08:57 } +2024-07-30 03:59:36,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 779/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 6.570036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:36,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65763 samples/s/p 2:08:56 } +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 781/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.5667555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66213 samples/s/p 2:08:47 } +2024-07-30 03:59:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 783/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 6.5634736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66005 samples/s/p 2:08:47 } +2024-07-30 03:59:44,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 785/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.560192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65882 samples/s/p 2:08:45 } +2024-07-30 03:59:47,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 787/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 6.556909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65519 samples/s/p 2:08:48 } +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 789/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 6.553625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65832 samples/s/p 2:08:41 } +2024-07-30 03:59:53,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 791/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 6.550342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66044 samples/s/p 2:08:35 } +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 793/ 3125], loss: 0.298, per_step_time: 1414ms, lr: 6.5470563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65663 samples/s/p 2:08:37 } +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 795/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.5437703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66074 samples/s/p 2:08:29 } +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 797/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.540484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65919 samples/s/p 2:08:28 } +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 799/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 6.5371964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65997 samples/s/p 2:08:24 } +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 801/ 3125], loss: 0.258, per_step_time: 1445ms, lr: 6.5339086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.53614 samples/s/p 2:11:14 } +2024-07-30 04:00:10,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 803/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 6.53062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:10,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66056 samples/s/p 2:08:18 } +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 805/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.5273302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65837 samples/s/p 2:08:18 } +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 807/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.5240406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66048 samples/s/p 2:08:12 } +2024-07-30 04:00:18,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 809/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 6.5207496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:18,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.65978 samples/s/p 2:08:10 } +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 811/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 6.5174577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66253 samples/s/p 2:08:04 } +2024-07-30 04:00:24,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 813/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.5141653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:24,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66036 samples/s/p 2:08:04 } +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 815/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 6.510872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66056 samples/s/p 2:08:01 } +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 817/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.507578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:30,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.65963 samples/s/p 2:07:59 } +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 819/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 6.504284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66059 samples/s/p 2:07:55 } +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 821/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 6.500989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66127 samples/s/p 2:07:51 } +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 823/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 6.497693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65807 samples/s/p 2:07:53 } +2024-07-30 04:00:41,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 825/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 6.494396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66366 samples/s/p 2:07:42 } +2024-07-30 04:00:44,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 827/ 3125], loss: 0.490, per_step_time: 1413ms, lr: 6.4910982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:44,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65957 samples/s/p 2:07:45 } +2024-07-30 04:00:47,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 829/ 3125], loss: 0.243, per_step_time: 1412ms, lr: 6.4878004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:47,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66182 samples/s/p 2:07:39 } +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 831/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 6.4845017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66011 samples/s/p 2:07:39 } +2024-07-30 04:00:52,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 833/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.481202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:52,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66088 samples/s/p 2:07:35 } +2024-07-30 04:00:55,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 835/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.4779024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:55,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65939 samples/s/p 2:07:34 } +2024-07-30 04:00:58,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 837/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.474601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:58,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66011 samples/s/p 2:07:30 } +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 839/ 3125], loss: 0.248, per_step_time: 1415ms, lr: 6.4712985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65364 samples/s/p 2:07:36 } +2024-07-30 04:01:04,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 841/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 6.4679966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:04,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66065 samples/s/p 2:07:24 } +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 843/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 6.464694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65618 samples/s/p 2:07:27 } +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 845/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 6.4613905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66161 samples/s/p 2:07:17 } +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 847/ 3125], loss: 0.428, per_step_time: 1414ms, lr: 6.4580854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65676 samples/s/p 2:07:21 } +2024-07-30 04:01:15,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 849/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 6.4547808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:15,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65678 samples/s/p 2:07:18 } +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 851/ 3125], loss: 0.377, per_step_time: 1414ms, lr: 6.4514747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65568 samples/s/p 2:07:16 } +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 853/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 6.448168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65377 samples/s/p 2:07:16 } +2024-07-30 04:01:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 855/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 6.4448614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:23,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66002 samples/s/p 2:07:05 } +2024-07-30 04:01:26,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 857/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 6.4415535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66114 samples/s/p 2:07:01 } +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 859/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 6.4382443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.65847 samples/s/p 2:07:01 } +2024-07-30 04:01:32,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 861/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 6.434935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:32,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66045 samples/s/p 2:06:56 } +2024-07-30 04:01:35,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 863/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.4316255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66089 samples/s/p 2:06:52 } +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 865/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.428315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65874 samples/s/p 2:06:53 } +2024-07-30 04:01:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 867/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 6.425004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:40,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65570 samples/s/p 2:06:54 } +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 869/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.4216915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65872 samples/s/p 2:06:47 } +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 871/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 6.4183782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.66057 samples/s/p 2:06:42 } +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 873/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 6.4150654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65962 samples/s/p 2:06:40 } +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 875/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 6.411751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.65992 samples/s/p 2:06:37 } +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 877/ 3125], loss: 0.635, per_step_time: 1413ms, lr: 6.408436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66055 samples/s/p 2:06:33 } +2024-07-30 04:01:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 879/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 6.4051214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:57,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66047 samples/s/p 2:06:30 } +2024-07-30 04:02:00,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 881/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.401805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66079 samples/s/p 2:06:27 } +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 883/ 3125], loss: 0.295, per_step_time: 1425ms, lr: 6.398488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.61097 samples/s/p 2:07:32 } +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 885/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 6.3951707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.66142 samples/s/p 2:06:21 } +2024-07-30 04:02:09,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 887/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.391853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65584 samples/s/p 2:06:25 } +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 889/ 3125], loss: 0.163, per_step_time: 1417ms, lr: 6.388534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.64495 samples/s/p 2:06:37 } +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 891/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 6.385215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65886 samples/s/p 2:06:16 } +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 893/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 6.3818943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65963 samples/s/p 2:06:12 } +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 895/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 6.378574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66031 samples/s/p 2:06:08 } +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 897/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 6.3752523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:23,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66152 samples/s/p 2:06:04 } +2024-07-30 04:02:26,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 899/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.371931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:26,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65971 samples/s/p 2:06:03 } +2024-07-30 04:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 901/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.3686084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:29,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66088 samples/s/p 2:05:59 } +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 903/ 3125], loss: 0.049, per_step_time: 1413ms, lr: 6.3652847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66052 samples/s/p 2:05:56 } +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 905/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 6.36196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66125 samples/s/p 2:05:53 } +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 907/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.358636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:37,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.65888 samples/s/p 2:05:53 } +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 909/ 3125], loss: 0.149, per_step_time: 1425ms, lr: 6.3553107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.61056 samples/s/p 2:06:55 } +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 911/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 6.3519847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66144 samples/s/p 2:05:44 } +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 913/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 6.3486586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66127 samples/s/p 2:05:41 } +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 915/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.345331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66124 samples/s/p 2:05:38 } +2024-07-30 04:02:51,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 917/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 6.342003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65815 samples/s/p 2:05:40 } +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 919/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.338674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65889 samples/s/p 2:05:36 } +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 921/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.3353455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66131 samples/s/p 2:05:30 } +2024-07-30 04:03:00,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 923/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.332016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:00,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66024 samples/s/p 2:05:29 } +2024-07-30 04:03:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 925/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 6.3286852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:03,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65985 samples/s/p 2:05:26 } +2024-07-30 04:03:05,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 927/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 6.3253538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:05,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65920 samples/s/p 2:05:24 } +2024-07-30 04:03:08,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 929/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 6.3220227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:08,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65550 samples/s/p 2:05:26 } +2024-07-30 04:03:11,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 931/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 6.318691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65755 samples/s/p 2:05:21 } +2024-07-30 04:03:14,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 933/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 6.315357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:14,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65809 samples/s/p 2:05:17 } +2024-07-30 04:03:17,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 935/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 6.3120237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:17,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65488 samples/s/p 2:05:19 } +2024-07-30 04:03:20,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 937/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 6.308689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:20,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65926 samples/s/p 2:05:10 } +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 939/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 6.305355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.66235 samples/s/p 2:05:03 } +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 941/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 6.3020193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.66250 samples/s/p 2:05:00 } +2024-07-30 04:03:28,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 943/ 3125], loss: 0.153, per_step_time: 1419ms, lr: 6.2986833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:28,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.63433 samples/s/p 2:05:35 } +2024-07-30 04:03:31,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 945/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.2953472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:31,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.65801 samples/s/p 2:05:00 } +2024-07-30 04:03:34,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 947/ 3125], loss: 0.170, per_step_time: 1418ms, lr: 6.2920094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:34,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.64055 samples/s/p 2:05:21 } +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 949/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 6.2886706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66044 samples/s/p 2:04:52 } +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 951/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 6.2853323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66137 samples/s/p 2:04:47 } +2024-07-30 04:03:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 953/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 6.281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65858 samples/s/p 2:04:48 } +2024-07-30 04:03:45,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 955/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.2786535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:45,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66085 samples/s/p 2:04:42 } +2024-07-30 04:03:48,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 957/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.2753134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:48,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65799 samples/s/p 2:04:43 } +2024-07-30 04:03:51,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 959/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 6.2719723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:51,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65637 samples/s/p 2:04:43 } +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 961/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.2686304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66157 samples/s/p 2:04:33 } +2024-07-30 04:03:56,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 963/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.2652884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:56,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66076 samples/s/p 2:04:31 } +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 965/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 6.2619456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66177 samples/s/p 2:04:27 } +2024-07-30 04:04:02,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 967/ 3125], loss: 0.455, per_step_time: 1413ms, lr: 6.2586028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:02,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65883 samples/s/p 2:04:28 } +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 969/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.255258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65986 samples/s/p 2:04:24 } +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 971/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 6.2519143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65939 samples/s/p 2:04:22 } +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 973/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 6.2485683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65820 samples/s/p 2:04:21 } +2024-07-30 04:04:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 975/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.245223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:13,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66039 samples/s/p 2:04:15 } +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 977/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 6.2418762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66054 samples/s/p 2:04:12 } +2024-07-30 04:04:19,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 979/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.2385297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65952 samples/s/p 2:04:10 } +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 981/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.2351824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65713 samples/s/p 2:04:11 } +2024-07-30 04:04:25,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 983/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.2318336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65931 samples/s/p 2:04:05 } +2024-07-30 04:04:28,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 985/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 6.228485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65503 samples/s/p 2:04:08 } +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 987/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 6.2251356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65705 samples/s/p 2:04:02 } +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 989/ 3125], loss: 0.135, per_step_time: 1418ms, lr: 6.221786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.63934 samples/s/p 2:04:23 } +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 991/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 6.218435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.66141 samples/s/p 2:03:51 } +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 993/ 3125], loss: 0.431, per_step_time: 1415ms, lr: 6.215085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65112 samples/s/p 2:04:02 } +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 995/ 3125], loss: 0.215, per_step_time: 1417ms, lr: 6.2117324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.64264 samples/s/p 2:04:10 } +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 997/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.2083805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.66134 samples/s/p 2:03:42 } +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 999/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 6.205027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.65775 samples/s/p 2:03:44 } +2024-07-30 04:04:50,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1001/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.2016743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:50,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65992 samples/s/p 2:03:39 } +2024-07-30 04:04:53,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1003/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 6.19832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65719 samples/s/p 2:03:39 } +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1005/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 6.194966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66184 samples/s/p 2:03:31 } +2024-07-30 04:04:59,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1007/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 6.19161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65857 samples/s/p 2:03:32 } +2024-07-30 04:05:02,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 6.1882547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:02,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65978 samples/s/p 2:03:28 } +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1011/ 3125], loss: 0.428, per_step_time: 1418ms, lr: 6.1848987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.63853 samples/s/p 2:03:53 } +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1013/ 3125], loss: 0.426, per_step_time: 1417ms, lr: 6.1815417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.64362 samples/s/p 2:03:43 } +2024-07-30 04:05:10,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1015/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.178185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:10,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65996 samples/s/p 2:03:19 } +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1017/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 6.174826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65976 samples/s/p 2:03:16 } +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1019/ 3125], loss: 0.236, per_step_time: 1414ms, lr: 6.1714672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65714 samples/s/p 2:03:17 } +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1021/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 6.1681085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65964 samples/s/p 2:03:11 } +2024-07-30 04:05:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1023/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.1647493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:22,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66016 samples/s/p 2:03:07 } +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1025/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.161389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65407 samples/s/p 2:03:12 } +2024-07-30 04:05:27,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1027/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 6.158028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:27,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65597 samples/s/p 2:03:07 } +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1029/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 6.1546666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.66081 samples/s/p 2:02:58 } +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1031/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 6.1513047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65873 samples/s/p 2:02:58 } +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1033/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 6.147943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.65951 samples/s/p 2:02:54 } +2024-07-30 04:05:39,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1035/ 3125], loss: 0.040, per_step_time: 1412ms, lr: 6.1445794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:39,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66197 samples/s/p 2:02:48 } +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1037/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.1412165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66006 samples/s/p 2:02:48 } +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1039/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 6.137852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66209 samples/s/p 2:02:42 } +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1041/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.134487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66114 samples/s/p 2:02:41 } +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1043/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.131122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66058 samples/s/p 2:02:38 } +2024-07-30 04:05:53,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1045/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.1277565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66039 samples/s/p 2:02:36 } +2024-07-30 04:05:56,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1047/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 6.124391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:56,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66040 samples/s/p 2:02:33 } +2024-07-30 04:05:58,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1049/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 6.121024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:58,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65769 samples/s/p 2:02:34 } +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1051/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.117656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65811 samples/s/p 2:02:30 } +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1053/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.114288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.65803 samples/s/p 2:02:28 } +2024-07-30 04:06:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1055/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 6.1109204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:07,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66002 samples/s/p 2:02:22 } +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1057/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.107551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66001 samples/s/p 2:02:19 } +2024-07-30 04:06:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1059/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 6.1041824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66198 samples/s/p 2:02:14 } +2024-07-30 04:06:15,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1061/ 3125], loss: 0.301, per_step_time: 1412ms, lr: 6.100812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:15,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66198 samples/s/p 2:02:11 } +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1063/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 6.097441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66170 samples/s/p 2:02:09 } +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1065/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.0940706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65976 samples/s/p 2:02:08 } +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1067/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 6.090699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65893 samples/s/p 2:02:07 } +2024-07-30 04:06:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1069/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 6.0873276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66047 samples/s/p 2:02:02 } +2024-07-30 04:06:30,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1071/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.083955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:30,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66108 samples/s/p 2:01:58 } +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1073/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 6.0805814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66022 samples/s/p 2:01:57 } +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1075/ 3125], loss: 0.729, per_step_time: 1414ms, lr: 6.0772086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65741 samples/s/p 2:01:57 } +2024-07-30 04:06:35,720 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:07:10,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1077/ 3125], loss: 0.403, per_step_time: 1656ms, lr: 6.0738334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:10,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 4.82805 samples/s/p 2:22:51 } +2024-07-30 04:07:13,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1079/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.070459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:13,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66008 samples/s/p 2:01:48 } +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1081/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 6.0670845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65961 samples/s/p 2:01:46 } +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1083/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 6.0637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:18,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65919 samples/s/p 2:01:44 } +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1085/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.060332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.66033 samples/s/p 2:01:39 } +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1087/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 6.056956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65913 samples/s/p 2:01:38 } +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1089/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 6.0535785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65913 samples/s/p 2:01:35 } +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1091/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.0502007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65894 samples/s/p 2:01:33 } +2024-07-30 04:07:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1093/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.0468233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.66074 samples/s/p 2:01:28 } +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1095/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 6.043444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65005 samples/s/p 2:01:39 } +2024-07-30 04:07:38,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1097/ 3125], loss: 0.269, per_step_time: 1416ms, lr: 6.0400653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:38,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.64953 samples/s/p 2:01:36 } +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1099/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 6.0366856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65724 samples/s/p 2:01:24 } +2024-07-30 04:07:44,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1101/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.0333055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:44,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66024 samples/s/p 2:01:17 } +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1103/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.0299253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66041 samples/s/p 2:01:14 } +2024-07-30 04:07:50,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1105/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.026544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:50,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66025 samples/s/p 2:01:11 } +2024-07-30 04:07:52,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1107/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 6.023162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:52,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65657 samples/s/p 2:01:13 } +2024-07-30 04:07:55,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1109/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 6.01978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:55,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66137 samples/s/p 2:01:04 } +2024-07-30 04:07:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1111/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.016398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:58,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65935 samples/s/p 2:01:04 } +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1113/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 6.013014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65901 samples/s/p 2:01:02 } +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1115/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.009631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65893 samples/s/p 2:00:59 } +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1117/ 3125], loss: 0.078, per_step_time: 1413ms, lr: 6.0062466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66045 samples/s/p 2:00:54 } +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1119/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.0028624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:09,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65417 samples/s/p 2:00:59 } +2024-07-30 04:08:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1121/ 3125], loss: 0.190, per_step_time: 1412ms, lr: 5.9994773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66214 samples/s/p 2:00:46 } +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1123/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.9960917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65836 samples/s/p 2:00:48 } +2024-07-30 04:08:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1125/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 5.992706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65429 samples/s/p 2:00:51 } +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1127/ 3125], loss: 0.462, per_step_time: 1414ms, lr: 5.9893196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65691 samples/s/p 2:00:44 } +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1129/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 5.985932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65711 samples/s/p 2:00:41 } +2024-07-30 04:08:26,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1131/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.9825456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:26,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65979 samples/s/p 2:00:35 } +2024-07-30 04:08:29,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1133/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 5.9791573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:29,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65333 samples/s/p 2:00:41 } +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1135/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 5.975769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66015 samples/s/p 2:00:29 } +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1137/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.9723807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66038 samples/s/p 2:00:26 } +2024-07-30 04:08:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1139/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 5.968991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66194 samples/s/p 2:00:21 } +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1141/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 5.9656018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66191 samples/s/p 2:00:18 } +2024-07-30 04:08:43,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1143/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 5.962211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66007 samples/s/p 2:00:18 } +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1145/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 5.958821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66127 samples/s/p 2:00:13 } +2024-07-30 04:08:49,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1147/ 3125], loss: 0.402, per_step_time: 1416ms, lr: 5.95543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.64790 samples/s/p 2:00:28 } +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1149/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.952038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:52,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.65948 samples/s/p 2:00:10 } +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1151/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 5.948646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66169 samples/s/p 2:00:04 } +2024-07-30 04:08:58,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1153/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.9452536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66065 samples/s/p 2:00:03 } +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1155/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.941861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65994 samples/s/p 2:00:01 } +2024-07-30 04:09:03,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1157/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.9384674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:03,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66082 samples/s/p 1:59:57 } +2024-07-30 04:09:06,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1159/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.935074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:06,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65901 samples/s/p 1:59:57 } +2024-07-30 04:09:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1161/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 5.9316794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65299 samples/s/p 2:00:01 } +2024-07-30 04:09:12,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1163/ 3125], loss: 0.257, per_step_time: 1414ms, lr: 5.9282843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:12,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65543 samples/s/p 1:59:55 } +2024-07-30 04:09:15,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1165/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.92489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:15,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65888 samples/s/p 1:59:48 } +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1167/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 5.921494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65798 samples/s/p 1:59:47 } +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1169/ 3125], loss: 0.143, per_step_time: 1414ms, lr: 5.9180984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65404 samples/s/p 1:59:49 } +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1171/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.914702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65897 samples/s/p 1:59:40 } +2024-07-30 04:09:26,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1173/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 5.911305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:26,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65625 samples/s/p 1:59:40 } +2024-07-30 04:09:29,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1175/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9079075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:29,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65948 samples/s/p 1:59:33 } +2024-07-30 04:09:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1177/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 5.90451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65989 samples/s/p 1:59:30 } +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1179/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 5.9011118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66038 samples/s/p 1:59:27 } +2024-07-30 04:09:37,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1181/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 5.897713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:37,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66013 samples/s/p 1:59:24 } +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1183/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 5.8943137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65282 samples/s/p 1:59:30 } +2024-07-30 04:09:43,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1185/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.890914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:43,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65747 samples/s/p 1:59:22 } +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1187/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 5.887515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65458 samples/s/p 1:59:23 } +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1189/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 5.884114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65504 samples/s/p 1:59:19 } +2024-07-30 04:09:51,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1191/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 5.880714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65663 samples/s/p 1:59:14 } +2024-07-30 04:09:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1193/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.877312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.65916 samples/s/p 1:59:08 } +2024-07-30 04:09:57,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1195/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.8739106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66110 samples/s/p 1:59:03 } +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1197/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 5.870509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66238 samples/s/p 1:58:59 } +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1199/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 5.867106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66095 samples/s/p 1:58:58 } +2024-07-30 04:10:06,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1201/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 5.863704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:06,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66080 samples/s/p 1:58:55 } +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1203/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.8603005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.65976 samples/s/p 1:58:53 } +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1205/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 5.8568967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66131 samples/s/p 1:58:49 } +2024-07-30 04:10:14,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1207/ 3125], loss: 0.055, per_step_time: 1413ms, lr: 5.8534924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:14,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.65899 samples/s/p 1:58:49 } +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1209/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.8500887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66085 samples/s/p 1:58:44 } +2024-07-30 04:10:20,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1211/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.846684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66022 samples/s/p 1:58:41 } +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1213/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.843279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65808 samples/s/p 1:58:41 } +2024-07-30 04:10:26,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1215/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.8398728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66162 samples/s/p 1:58:34 } +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1217/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.8364662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65856 samples/s/p 1:58:35 } +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1219/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 5.83306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:31,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66064 samples/s/p 1:58:30 } +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1221/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.829653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66151 samples/s/p 1:58:26 } +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1223/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 5.826246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65934 samples/s/p 1:58:26 } +2024-07-30 04:10:40,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1225/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 5.8228384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:40,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65982 samples/s/p 1:58:22 } +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1227/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 5.81943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:43,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65743 samples/s/p 1:58:22 } +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1229/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 5.8160213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65740 samples/s/p 1:58:20 } +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1231/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 5.8126125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65923 samples/s/p 1:58:14 } +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1233/ 3125], loss: 0.504, per_step_time: 1414ms, lr: 5.8092037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65529 samples/s/p 1:58:17 } +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1235/ 3125], loss: 0.378, per_step_time: 1416ms, lr: 5.805794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.64941 samples/s/p 1:58:21 } +2024-07-30 04:10:57,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1237/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 5.8023843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:57,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65467 samples/s/p 1:58:12 } +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1239/ 3125], loss: 0.475, per_step_time: 1413ms, lr: 5.7989732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.66012 samples/s/p 1:58:02 } +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1241/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 5.7955635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66119 samples/s/p 1:57:58 } +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1243/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.7921516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66130 samples/s/p 1:57:55 } +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1245/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.7887405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66088 samples/s/p 1:57:53 } +2024-07-30 04:11:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1247/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.7853285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66084 samples/s/p 1:57:50 } +2024-07-30 04:11:14,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1249/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 5.781916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66100 samples/s/p 1:57:47 } +2024-07-30 04:11:17,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1251/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7785032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:17,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65975 samples/s/p 1:57:46 } +2024-07-30 04:11:19,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1253/ 3125], loss: 0.485, per_step_time: 1413ms, lr: 5.7750904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:19,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65810 samples/s/p 1:57:45 } +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1255/ 3125], loss: 0.230, per_step_time: 1415ms, lr: 5.7716775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:22,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65261 samples/s/p 1:57:49 } +2024-07-30 04:11:25,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1257/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 5.7682632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:25,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65979 samples/s/p 1:57:37 } +2024-07-30 04:11:28,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1259/ 3125], loss: 0.243, per_step_time: 1415ms, lr: 5.7648494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:28,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65290 samples/s/p 1:57:43 } +2024-07-30 04:11:31,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1261/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 5.7614347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65887 samples/s/p 1:57:32 } +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1263/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.75802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65900 samples/s/p 1:57:30 } +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1265/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.754605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.66053 samples/s/p 1:57:25 } +2024-07-30 04:11:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1267/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.7511893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65943 samples/s/p 1:57:23 } +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1269/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.7477737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65884 samples/s/p 1:57:21 } +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1271/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.7443576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65503 samples/s/p 1:57:23 } +2024-07-30 04:11:48,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1273/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.7409397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:48,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66063 samples/s/p 1:57:13 } +2024-07-30 04:11:51,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1275/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 5.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:51,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66131 samples/s/p 1:57:10 } +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1277/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 5.7341063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65867 samples/s/p 1:57:10 } +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1279/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.7306884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66016 samples/s/p 1:57:05 } +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1281/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.7272705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65583 samples/s/p 1:57:08 } +2024-07-30 04:12:02,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1283/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.723852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:02,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65878 samples/s/p 1:57:02 } +2024-07-30 04:12:05,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1285/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7204334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:05,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66098 samples/s/p 1:56:56 } +2024-07-30 04:12:08,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1287/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 5.717014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:08,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65527 samples/s/p 1:57:00 } +2024-07-30 04:12:10,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1289/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 5.713595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:10,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65962 samples/s/p 1:56:52 } +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1291/ 3125], loss: 0.583, per_step_time: 1417ms, lr: 5.7101756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.64495 samples/s/p 1:57:07 } +2024-07-30 04:12:16,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1293/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 5.7067546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:16,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65629 samples/s/p 1:56:50 } +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1295/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 5.703335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66071 samples/s/p 1:56:42 } +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1297/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 5.6999133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66115 samples/s/p 1:56:39 } +2024-07-30 04:12:25,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1299/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 5.6964927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:25,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66025 samples/s/p 1:56:37 } +2024-07-30 04:12:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1301/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 5.6930708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66146 samples/s/p 1:56:33 } +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1303/ 3125], loss: 0.185, per_step_time: 1415ms, lr: 5.6896492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.65363 samples/s/p 1:56:40 } +2024-07-30 04:12:33,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1305/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 5.6862277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65825 samples/s/p 1:56:31 } +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1307/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.682805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65893 samples/s/p 1:56:27 } +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1309/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 5.679382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66132 samples/s/p 1:56:22 } +2024-07-30 04:12:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1311/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.675959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66043 samples/s/p 1:56:20 } +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1313/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.6725357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66034 samples/s/p 1:56:17 } +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1315/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.669112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:47,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66031 samples/s/p 1:56:14 } +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1317/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.665688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66156 samples/s/p 1:56:10 } +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1319/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.6622634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65945 samples/s/p 1:56:10 } +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1321/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 5.658839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65974 samples/s/p 1:56:07 } +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1323/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 5.6554136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65733 samples/s/p 1:56:07 } +2024-07-30 04:13:01,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1325/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 5.651989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:01,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65977 samples/s/p 1:56:01 } +2024-07-30 04:13:04,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1327/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 5.6485633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:04,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65874 samples/s/p 1:55:59 } +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1329/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.645137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.66011 samples/s/p 1:55:55 } +2024-07-30 04:13:10,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1331/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 5.6417107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:10,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65037 samples/s/p 1:56:04 } +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1333/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 5.6382846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65380 samples/s/p 1:55:57 } +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1335/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.6348576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65809 samples/s/p 1:55:49 } +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1337/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.63143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65915 samples/s/p 1:55:45 } +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1339/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 5.6280032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66136 samples/s/p 1:55:39 } +2024-07-30 04:13:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1341/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 5.624575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66013 samples/s/p 1:55:38 } +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1343/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 5.621147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:27,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65616 samples/s/p 1:55:40 } +2024-07-30 04:13:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1345/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 5.6177187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:30,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65787 samples/s/p 1:55:35 } +2024-07-30 04:13:33,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1347/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.61429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:33,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65499 samples/s/p 1:55:36 } +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1349/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.6108615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65798 samples/s/p 1:55:29 } +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1351/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 5.607432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65930 samples/s/p 1:55:25 } +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1353/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.604002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65898 samples/s/p 1:55:22 } +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1355/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 5.600573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.66141 samples/s/p 1:55:17 } +2024-07-30 04:13:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1357/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.597143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65967 samples/s/p 1:55:16 } +2024-07-30 04:13:50,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1359/ 3125], loss: 0.180, per_step_time: 1415ms, lr: 5.593712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:50,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65316 samples/s/p 1:55:21 } +2024-07-30 04:13:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1361/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 5.590282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66173 samples/s/p 1:55:08 } +2024-07-30 04:13:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1363/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.5868504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65810 samples/s/p 1:55:09 } +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1365/ 3125], loss: 0.329, per_step_time: 1414ms, lr: 5.583419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65416 samples/s/p 1:55:11 } +2024-07-30 04:14:01,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1367/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.579988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:01,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66025 samples/s/p 1:55:01 } +2024-07-30 04:14:04,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1369/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 5.5765563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66047 samples/s/p 1:54:58 } +2024-07-30 04:14:07,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1371/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 5.5731243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:07,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.66170 samples/s/p 1:54:54 } +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1373/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 5.5696914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.65870 samples/s/p 1:54:54 } +2024-07-30 04:14:12,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1375/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 5.566259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66153 samples/s/p 1:54:48 } +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1377/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 5.562826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66024 samples/s/p 1:54:47 } +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1379/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.5593937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.65811 samples/s/p 1:54:47 } +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1381/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.55596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:21,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65789 samples/s/p 1:54:44 } +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1383/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.5525265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65974 samples/s/p 1:54:39 } +2024-07-30 04:14:26,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1385/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.5490923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:26,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65846 samples/s/p 1:54:38 } +2024-07-30 04:14:29,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1387/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 5.5456576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:29,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65877 samples/s/p 1:54:34 } +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1389/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.5422233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.66057 samples/s/p 1:54:29 } +2024-07-30 04:14:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1391/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 5.538789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65788 samples/s/p 1:54:30 } +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1393/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 5.5353544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65705 samples/s/p 1:54:28 } +2024-07-30 04:14:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1395/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.5319188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65797 samples/s/p 1:54:24 } +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1397/ 3125], loss: 0.091, per_step_time: 1414ms, lr: 5.5284827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65681 samples/s/p 1:54:23 } +2024-07-30 04:14:46,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1399/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.5250475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:46,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65843 samples/s/p 1:54:18 } +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1401/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.521611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:49,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65731 samples/s/p 1:54:16 } +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1403/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.5181754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:52,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.66022 samples/s/p 1:54:10 } +2024-07-30 04:14:55,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1405/ 3125], loss: 0.088, per_step_time: 1413ms, lr: 5.514739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:55,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.66089 samples/s/p 1:54:06 } +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1407/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.5113014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65655 samples/s/p 1:54:09 } +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1409/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 5.507865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65907 samples/s/p 1:54:03 } +2024-07-30 04:15:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1411/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.5044275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66008 samples/s/p 1:53:59 } +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1413/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 5.5009905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66051 samples/s/p 1:53:56 } +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1415/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.497553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65785 samples/s/p 1:53:56 } +2024-07-30 04:15:12,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1417/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 5.4941147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:12,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66084 samples/s/p 1:53:50 } +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1419/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.490676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.66063 samples/s/p 1:53:47 } +2024-07-30 04:15:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1421/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 5.487238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65966 samples/s/p 1:53:45 } +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1423/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 5.483799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65651 samples/s/p 1:53:46 } +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1425/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.480361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65957 samples/s/p 1:53:40 } +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1427/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.4769216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65827 samples/s/p 1:53:39 } +2024-07-30 04:15:29,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1429/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 5.4734824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65851 samples/s/p 1:53:35 } +2024-07-30 04:15:32,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1431/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.470042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:32,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65966 samples/s/p 1:53:31 } +2024-07-30 04:15:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1433/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.466603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:34,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66149 samples/s/p 1:53:26 } +2024-07-30 04:15:37,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1435/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 5.4631632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66061 samples/s/p 1:53:24 } +2024-07-30 04:15:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1437/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 5.4597226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66163 samples/s/p 1:53:20 } +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1439/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 5.4562825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66160 samples/s/p 1:53:18 } +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1441/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4528414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66164 samples/s/p 1:53:15 } +2024-07-30 04:15:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1443/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 5.449401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65819 samples/s/p 1:53:16 } +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1445/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 5.4459592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65072 samples/s/p 1:53:22 } +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1447/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 5.4425186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65949 samples/s/p 1:53:09 } +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1449/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4390775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65954 samples/s/p 1:53:06 } +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1451/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.435635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65911 samples/s/p 1:53:04 } +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1453/ 3125], loss: 0.465, per_step_time: 1415ms, lr: 5.432193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65186 samples/s/p 1:53:09 } +2024-07-30 04:16:06,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1455/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.428751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:06,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65993 samples/s/p 1:52:57 } +2024-07-30 04:16:09,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1457/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 5.4253087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:09,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65721 samples/s/p 1:52:57 } +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1459/ 3125], loss: 0.303, per_step_time: 1412ms, lr: 5.4218663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66173 samples/s/p 1:52:49 } +2024-07-30 04:16:14,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1461/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 5.418424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:14,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66082 samples/s/p 1:52:47 } +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1463/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 5.4149805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:17,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65735 samples/s/p 1:52:49 } +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1465/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 5.4115376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66224 samples/s/p 1:52:40 } +2024-07-30 04:16:23,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1467/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.408094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:23,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66033 samples/s/p 1:52:40 } +2024-07-30 04:16:26,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1469/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.4046504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65648 samples/s/p 1:52:41 } +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1471/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.401207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65434 samples/s/p 1:52:41 } +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1473/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 5.3977633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65918 samples/s/p 1:52:32 } +2024-07-30 04:16:34,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1475/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 5.3943186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:34,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.66169 samples/s/p 1:52:27 } +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1477/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 5.390875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.66005 samples/s/p 1:52:26 } +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1479/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 5.38743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65723 samples/s/p 1:52:26 } +2024-07-30 04:16:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1481/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.3839854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:43,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65901 samples/s/p 1:52:21 } +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1483/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 5.380541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65781 samples/s/p 1:52:20 } +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1485/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 5.377095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65780 samples/s/p 1:52:17 } +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1487/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 5.3736508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66067 samples/s/p 1:52:11 } +2024-07-30 04:16:54,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1489/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.3702047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:54,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66073 samples/s/p 1:52:08 } +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1491/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 5.366759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66225 samples/s/p 1:52:03 } +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1493/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.363314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65937 samples/s/p 1:52:04 } +2024-07-30 04:17:02,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1495/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.359868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65948 samples/s/p 1:52:01 } +2024-07-30 04:17:05,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1497/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.3564213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:05,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66048 samples/s/p 1:51:57 } +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1499/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.3529757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65955 samples/s/p 1:51:55 } +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1501/ 3125], loss: 0.433, per_step_time: 1412ms, lr: 5.349529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66191 samples/s/p 1:51:50 } +2024-07-30 04:17:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1503/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 5.346082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66017 samples/s/p 1:51:49 } +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1505/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.342636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65965 samples/s/p 1:51:47 } +2024-07-30 04:17:19,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1507/ 3125], loss: 0.189, per_step_time: 1415ms, lr: 5.3391886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:19,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65173 samples/s/p 1:51:53 } +2024-07-30 04:17:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1509/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 5.3357408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65638 samples/s/p 1:51:45 } +2024-07-30 04:17:25,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1511/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.3322938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:25,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65921 samples/s/p 1:51:39 } +2024-07-30 04:17:28,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1513/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.3288472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:28,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65733 samples/s/p 1:51:38 } +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1515/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.3253993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65865 samples/s/p 1:51:34 } +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1517/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.321952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65954 samples/s/p 1:51:30 } +2024-07-30 04:17:36,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1519/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 5.318504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:36,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.66180 samples/s/p 1:51:24 } +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1521/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.3150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66083 samples/s/p 1:51:23 } +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1523/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.311608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:42,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66057 samples/s/p 1:51:20 } +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1525/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 5.3081594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66256 samples/s/p 1:51:15 } +2024-07-30 04:17:48,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1527/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.3047115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.65980 samples/s/p 1:51:15 } +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1529/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 5.301262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66106 samples/s/p 1:51:11 } +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1531/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 5.2978135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66054 samples/s/p 1:51:09 } +2024-07-30 04:17:56,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1533/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 5.2943647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:56,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65908 samples/s/p 1:51:08 } +2024-07-30 04:17:59,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1535/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 5.290916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:59,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66063 samples/s/p 1:51:03 } +2024-07-30 04:18:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1537/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 5.287467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65705 samples/s/p 1:51:04 } +2024-07-30 04:18:05,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1539/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.2840173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:05,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65748 samples/s/p 1:51:01 } +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1541/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.280567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66221 samples/s/p 1:50:53 } +2024-07-30 04:18:10,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1543/ 3125], loss: 0.397, per_step_time: 1414ms, lr: 5.277118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.65467 samples/s/p 1:50:59 } +2024-07-30 04:18:13,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1545/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.2736686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66085 samples/s/p 1:50:49 } +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1547/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 5.270219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66081 samples/s/p 1:50:46 } +2024-07-30 04:18:19,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1549/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 5.2667688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65763 samples/s/p 1:50:47 } +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1551/ 3125], loss: 0.416, per_step_time: 1414ms, lr: 5.263318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65414 samples/s/p 1:50:48 } +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1553/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 5.259868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65810 samples/s/p 1:50:41 } +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1555/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.256418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65406 samples/s/p 1:50:43 } +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1557/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.252967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.66152 samples/s/p 1:50:31 } +2024-07-30 04:18:33,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1559/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.2495175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:33,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65820 samples/s/p 1:50:32 } +2024-07-30 04:18:36,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1561/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.2460664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:36,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65791 samples/s/p 1:50:30 } +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1563/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 5.2426153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65406 samples/s/p 1:50:31 } +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1565/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 5.2391642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65766 samples/s/p 1:50:24 } +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1567/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.235713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.66051 samples/s/p 1:50:18 } +2024-07-30 04:18:47,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1569/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 5.232262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:47,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65406 samples/s/p 1:50:23 } +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1571/ 3125], loss: 0.227, per_step_time: 1412ms, lr: 5.2288115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66279 samples/s/p 1:50:10 } +2024-07-30 04:18:53,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1573/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.225359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:53,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66005 samples/s/p 1:50:10 } +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1575/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 5.2219075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66033 samples/s/p 1:50:07 } +2024-07-30 04:18:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1577/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.2184564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:59,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65864 samples/s/p 1:50:06 } +2024-07-30 04:19:01,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1579/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.2150044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:01,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65893 samples/s/p 1:50:03 } +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1581/ 3125], loss: 0.413, per_step_time: 1416ms, lr: 5.2115533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.64618 samples/s/p 1:50:15 } +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1583/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 5.2081014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66204 samples/s/p 1:49:54 } +2024-07-30 04:19:10,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1585/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.204649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65963 samples/s/p 1:49:54 } +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1587/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.2011965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.65866 samples/s/p 1:49:52 } +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1589/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 5.197744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.64705 samples/s/p 1:50:03 } +2024-07-30 04:19:18,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1591/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.1942925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:18,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66080 samples/s/p 1:49:44 } +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1593/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 5.19084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66030 samples/s/p 1:49:41 } +2024-07-30 04:19:24,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1595/ 3125], loss: 0.381, per_step_time: 1412ms, lr: 5.187388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:24,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66282 samples/s/p 1:49:36 } +2024-07-30 04:19:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1597/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.1839343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65576 samples/s/p 1:49:41 } +2024-07-30 04:19:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1599/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 5.1804823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66109 samples/s/p 1:49:32 } +2024-07-30 04:19:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1601/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 5.17703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65924 samples/s/p 1:49:31 } +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1603/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 5.1735765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65721 samples/s/p 1:49:31 } +2024-07-30 04:19:38,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1605/ 3125], loss: 0.489, per_step_time: 1412ms, lr: 5.170124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:38,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.66270 samples/s/p 1:49:22 } +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1607/ 3125], loss: 0.258, per_step_time: 1414ms, lr: 5.166671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65582 samples/s/p 1:49:27 } +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1609/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 5.163218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65617 samples/s/p 1:49:24 } +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1611/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 5.159764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65649 samples/s/p 1:49:20 } +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1613/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 5.156311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65522 samples/s/p 1:49:19 } +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1615/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 5.152858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65741 samples/s/p 1:49:14 } +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1617/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 5.149405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66168 samples/s/p 1:49:06 } +2024-07-30 04:19:58,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1619/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.1459515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:58,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66020 samples/s/p 1:49:05 } +2024-07-30 04:20:01,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1621/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 5.1424972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:01,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66099 samples/s/p 1:49:01 } +2024-07-30 04:20:04,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1623/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 5.1390443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65938 samples/s/p 1:49:00 } +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1625/ 3125], loss: 0.078, per_step_time: 1417ms, lr: 5.1355905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.64343 samples/s/p 1:49:16 } +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1627/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 5.1321367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65578 samples/s/p 1:48:59 } +2024-07-30 04:20:12,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1629/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 5.1286834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65831 samples/s/p 1:48:53 } +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1631/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.125229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65964 samples/s/p 1:48:49 } +2024-07-30 04:20:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1633/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 5.1217744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66022 samples/s/p 1:48:45 } +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1635/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.118321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65914 samples/s/p 1:48:43 } +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1637/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 5.1148677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65991 samples/s/p 1:48:40 } +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1639/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.111413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65989 samples/s/p 1:48:37 } +2024-07-30 04:20:29,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1641/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 5.107959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65937 samples/s/p 1:48:35 } +2024-07-30 04:20:32,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1643/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.104505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:32,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66011 samples/s/p 1:48:31 } +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1645/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 5.1010506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66005 samples/s/p 1:48:28 } +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1647/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.097596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66043 samples/s/p 1:48:25 } +2024-07-30 04:20:41,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1649/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 5.0941417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66248 samples/s/p 1:48:20 } +2024-07-30 04:20:43,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1651/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.090688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:43,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.65979 samples/s/p 1:48:20 } +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1653/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.087233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66040 samples/s/p 1:48:17 } +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1655/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 5.0837784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65993 samples/s/p 1:48:14 } +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1657/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.080324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65961 samples/s/p 1:48:12 } +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1659/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.0768704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65944 samples/s/p 1:48:09 } +2024-07-30 04:20:58,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1661/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.0734147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:58,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.66035 samples/s/p 1:48:05 } +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1663/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.069961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65949 samples/s/p 1:48:03 } +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1665/ 3125], loss: 0.072, per_step_time: 1413ms, lr: 5.0665058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65912 samples/s/p 1:48:01 } +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1667/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 5.0630515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65915 samples/s/p 1:47:58 } +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1669/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 5.0595963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65735 samples/s/p 1:47:57 } +2024-07-30 04:21:12,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1671/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 5.056142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:12,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65679 samples/s/p 1:47:55 } +2024-07-30 04:21:15,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1673/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 5.0526874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:15,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65139 samples/s/p 1:47:59 } +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1675/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 5.049232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65818 samples/s/p 1:47:48 } +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1677/ 3125], loss: 0.251, per_step_time: 1415ms, lr: 5.0457775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65315 samples/s/p 1:47:51 } +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1679/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 5.0423228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.66076 samples/s/p 1:47:39 } +2024-07-30 04:21:26,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1681/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 5.038868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:26,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66056 samples/s/p 1:47:37 } +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1683/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 5.035413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65975 samples/s/p 1:47:35 } +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1685/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.031958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65956 samples/s/p 1:47:32 } +2024-07-30 04:21:34,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1687/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.028503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:34,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65797 samples/s/p 1:47:31 } +2024-07-30 04:21:37,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1689/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 5.0250483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65741 samples/s/p 1:47:29 } +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1691/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 5.0215936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66233 samples/s/p 1:47:21 } +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1693/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.018139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66036 samples/s/p 1:47:20 } +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1695/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 5.014684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65599 samples/s/p 1:47:22 } +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1697/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 5.011229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65923 samples/s/p 1:47:16 } +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1699/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 5.0077733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65943 samples/s/p 1:47:13 } +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1701/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.0043186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66105 samples/s/p 1:47:08 } +2024-07-30 04:21:57,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1703/ 3125], loss: 0.478, per_step_time: 1413ms, lr: 5.0008643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66060 samples/s/p 1:47:06 } +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1705/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.997409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65884 samples/s/p 1:47:05 } +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1707/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.993954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66064 samples/s/p 1:47:00 } +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1709/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 4.9904984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65768 samples/s/p 1:47:01 } +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1711/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 4.987043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66253 samples/s/p 1:46:52 } +2024-07-30 04:22:11,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1713/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 4.9835885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66056 samples/s/p 1:46:52 } +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1715/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 4.980134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66279 samples/s/p 1:46:46 } +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1717/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 4.9766795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65687 samples/s/p 1:46:50 } +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1719/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 4.9732243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65983 samples/s/p 1:46:44 } +2024-07-30 04:22:23,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1721/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 4.9697696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:23,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65961 samples/s/p 1:46:41 } +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1723/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 4.9663136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65524 samples/s/p 1:46:43 } +2024-07-30 04:22:28,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1725/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 4.962859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:28,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65848 samples/s/p 1:46:37 } +2024-07-30 04:22:31,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1727/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 4.9594046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66127 samples/s/p 1:46:31 } +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1729/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 4.95595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66071 samples/s/p 1:46:29 } +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1731/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.952495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65815 samples/s/p 1:46:29 } +2024-07-30 04:22:40,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1733/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 4.9490404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:40,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66018 samples/s/p 1:46:24 } +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1735/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 4.9455857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65649 samples/s/p 1:46:25 } +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1737/ 3125], loss: 0.193, per_step_time: 1415ms, lr: 4.9421305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65207 samples/s/p 1:46:27 } +2024-07-30 04:22:48,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1739/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.938676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:48,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65926 samples/s/p 1:46:16 } +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1741/ 3125], loss: 0.430, per_step_time: 1412ms, lr: 4.935221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66295 samples/s/p 1:46:09 } +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1743/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 4.9317664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66083 samples/s/p 1:46:09 } +2024-07-30 04:22:57,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1745/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 4.928312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66212 samples/s/p 1:46:05 } +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1747/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 4.924858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.66081 samples/s/p 1:46:03 } +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1749/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.9214036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.65960 samples/s/p 1:46:02 } +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1751/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.917948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.66107 samples/s/p 1:45:57 } +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1753/ 3125], loss: 0.163, per_step_time: 1414ms, lr: 4.9144937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.65763 samples/s/p 1:45:58 } +2024-07-30 04:23:11,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1755/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.911039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:11,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65773 samples/s/p 1:45:55 } +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1757/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 4.9075848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65401 samples/s/p 1:45:57 } +2024-07-30 04:23:16,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1759/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.904131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:16,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66242 samples/s/p 1:45:44 } +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1761/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 4.9006767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65765 samples/s/p 1:45:47 } +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1763/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.8972224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66143 samples/s/p 1:45:40 } +2024-07-30 04:23:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1765/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.8937677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66230 samples/s/p 1:45:36 } +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1767/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 4.8903134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65836 samples/s/p 1:45:38 } +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1769/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 4.8868596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65860 samples/s/p 1:45:35 } +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1771/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 4.883406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65943 samples/s/p 1:45:31 } +2024-07-30 04:23:36,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1773/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.879952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:36,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65922 samples/s/p 1:45:28 } +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1775/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 4.8764978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66026 samples/s/p 1:45:24 } +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1777/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.873044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66083 samples/s/p 1:45:21 } +2024-07-30 04:23:45,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1779/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 4.8695906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:45,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66000 samples/s/p 1:45:19 } +2024-07-30 04:23:48,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1781/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 4.866136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66042 samples/s/p 1:45:16 } +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1783/ 3125], loss: 0.181, per_step_time: 1412ms, lr: 4.8626825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66218 samples/s/p 1:45:11 } +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1785/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 4.859229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65949 samples/s/p 1:45:11 } +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1787/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 4.855775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65996 samples/s/p 1:45:08 } +2024-07-30 04:23:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1789/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 4.852322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:59,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65631 samples/s/p 1:45:09 } +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1791/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.8488687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65891 samples/s/p 1:45:03 } +2024-07-30 04:24:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1793/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 4.845416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:05,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65651 samples/s/p 1:45:03 } +2024-07-30 04:24:07,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1795/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 4.8419615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:07,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65766 samples/s/p 1:44:59 } +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1797/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.8385086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65836 samples/s/p 1:44:55 } +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1799/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 4.8350553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.66148 samples/s/p 1:44:49 } +2024-07-30 04:24:16,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1801/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 4.8316024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65267 samples/s/p 1:44:56 } +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1803/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.82815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66060 samples/s/p 1:44:44 } +2024-07-30 04:24:22,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1805/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 4.824697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:22,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66256 samples/s/p 1:44:39 } +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1807/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 4.821244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66036 samples/s/p 1:44:39 } +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1809/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 4.8177913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66125 samples/s/p 1:44:35 } +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1811/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 4.814338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66120 samples/s/p 1:44:32 } +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1813/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.810886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65862 samples/s/p 1:44:32 } +2024-07-30 04:24:36,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1815/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.8074335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:36,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66054 samples/s/p 1:44:27 } +2024-07-30 04:24:39,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1817/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 4.8039815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65951 samples/s/p 1:44:26 } +2024-07-30 04:24:42,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1819/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 4.800529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66109 samples/s/p 1:44:21 } +2024-07-30 04:24:44,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1821/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 4.797077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:44,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66173 samples/s/p 1:44:18 } +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1823/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.793624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65799 samples/s/p 1:44:19 } +2024-07-30 04:24:50,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1825/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.7901726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:50,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66015 samples/s/p 1:44:14 } +2024-07-30 04:24:53,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1827/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 4.7867206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:53,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65866 samples/s/p 1:44:13 } +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1829/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 4.7832696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66001 samples/s/p 1:44:08 } +2024-07-30 04:24:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1831/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 4.779817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:59,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66023 samples/s/p 1:44:05 } +2024-07-30 04:25:01,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1833/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.776366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66061 samples/s/p 1:44:02 } +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1835/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.772915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66044 samples/s/p 1:43:59 } +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1837/ 3125], loss: 0.406, per_step_time: 1417ms, lr: 4.769464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.64463 samples/s/p 1:44:14 } +2024-07-30 04:25:10,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1839/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.766012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66093 samples/s/p 1:43:53 } +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1841/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 4.762561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:13,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65787 samples/s/p 1:43:54 } +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1843/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 4.7591093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65489 samples/s/p 1:43:54 } +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1845/ 3125], loss: 0.663, per_step_time: 1416ms, lr: 4.755659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.64701 samples/s/p 1:44:00 } +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1847/ 3125], loss: 0.470, per_step_time: 1413ms, lr: 4.7522085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65939 samples/s/p 1:43:43 } +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1849/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 4.748758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65695 samples/s/p 1:43:43 } +2024-07-30 04:25:27,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1851/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7453073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:27,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66066 samples/s/p 1:43:36 } +2024-07-30 04:25:30,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1853/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 4.741856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65946 samples/s/p 1:43:35 } +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1855/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 4.738406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66082 samples/s/p 1:43:31 } +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1857/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.734956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66081 samples/s/p 1:43:28 } +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1859/ 3125], loss: 0.089, per_step_time: 1414ms, lr: 4.731506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65436 samples/s/p 1:43:32 } +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1861/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 4.728057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65750 samples/s/p 1:43:26 } +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1863/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 4.7246062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65966 samples/s/p 1:43:21 } +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1865/ 3125], loss: 0.362, per_step_time: 1414ms, lr: 4.721157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65707 samples/s/p 1:43:21 } +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1867/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.717707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65894 samples/s/p 1:43:16 } +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1869/ 3125], loss: 0.168, per_step_time: 1412ms, lr: 4.7142576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66193 samples/s/p 1:43:10 } +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1871/ 3125], loss: 0.289, per_step_time: 1416ms, lr: 4.7108088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.64927 samples/s/p 1:43:21 } +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1873/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 4.70736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66128 samples/s/p 1:43:05 } +2024-07-30 04:26:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1875/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.7039107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.65966 samples/s/p 1:43:04 } +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1877/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.700462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66035 samples/s/p 1:43:00 } +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1879/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.6970135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65963 samples/s/p 1:42:58 } +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1881/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.6935643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65869 samples/s/p 1:42:56 } +2024-07-30 04:26:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1883/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 4.690116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:12,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65830 samples/s/p 1:42:54 } +2024-07-30 04:26:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1885/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 4.686668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:15,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66301 samples/s/p 1:42:46 } +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1887/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 4.6832197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65902 samples/s/p 1:42:47 } +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1889/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.679772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65995 samples/s/p 1:42:44 } +2024-07-30 04:26:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1891/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.6763244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65829 samples/s/p 1:42:42 } +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1893/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 4.672877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65668 samples/s/p 1:42:41 } +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1895/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.6694286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.66136 samples/s/p 1:42:34 } +2024-07-30 04:26:32,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1897/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 4.6659816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:32,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66012 samples/s/p 1:42:32 } +2024-07-30 04:26:35,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1899/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 4.662534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:35,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.65917 samples/s/p 1:42:30 } +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1901/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.659087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66208 samples/s/p 1:42:24 } +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1903/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.655641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66004 samples/s/p 1:42:24 } +2024-07-30 04:26:43,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1905/ 3125], loss: 0.525, per_step_time: 1413ms, lr: 4.652194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66167 samples/s/p 1:42:19 } +2024-07-30 04:26:46,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1907/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 4.648748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.65937 samples/s/p 1:42:19 } +2024-07-30 04:26:49,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1909/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 4.6453015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:49,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66134 samples/s/p 1:42:14 } +2024-07-30 04:26:52,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1911/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 4.6418545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66136 samples/s/p 1:42:11 } +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1913/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.6384084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66058 samples/s/p 1:42:09 } +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1915/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.6349633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66109 samples/s/p 1:42:06 } +2024-07-30 04:27:00,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1917/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.6315176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:00,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65974 samples/s/p 1:42:04 } +2024-07-30 04:27:03,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1919/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.6280725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66037 samples/s/p 1:42:01 } +2024-07-30 04:27:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1921/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 4.624627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65794 samples/s/p 1:42:00 } +2024-07-30 04:27:09,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1923/ 3125], loss: 0.213, per_step_time: 1415ms, lr: 4.621182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:09,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65298 samples/s/p 1:42:03 } +2024-07-30 04:27:12,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1925/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 4.617736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:12,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65828 samples/s/p 1:41:54 } +2024-07-30 04:27:15,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1927/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.614292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:15,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65736 samples/s/p 1:41:53 } +2024-07-30 04:27:17,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1929/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.6108476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:17,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65879 samples/s/p 1:41:48 } +2024-07-30 04:27:20,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1931/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 4.6074033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.66102 samples/s/p 1:41:43 } +2024-07-30 04:27:23,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1933/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.603959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:23,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65904 samples/s/p 1:41:42 } +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1935/ 3125], loss: 0.469, per_step_time: 1413ms, lr: 4.6005152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65848 samples/s/p 1:41:40 } +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1937/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.5970714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65969 samples/s/p 1:41:36 } +2024-07-30 04:27:32,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1939/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.593627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:32,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.65978 samples/s/p 1:41:33 } +2024-07-30 04:27:34,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1941/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.590184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:34,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.65926 samples/s/p 1:41:31 } +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1943/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.586741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.66006 samples/s/p 1:41:27 } +2024-07-30 04:27:40,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1945/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 4.5832976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:40,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65440 samples/s/p 1:41:30 } +2024-07-30 04:27:43,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1947/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 4.579855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:43,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65972 samples/s/p 1:41:22 } +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1949/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.5764127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65843 samples/s/p 1:41:20 } +2024-07-30 04:27:49,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1951/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 4.5729703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:49,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65558 samples/s/p 1:41:21 } +2024-07-30 04:27:51,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1953/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.5695274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66063 samples/s/p 1:41:12 } +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1955/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.5660854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65781 samples/s/p 1:41:13 } +2024-07-30 04:27:57,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1957/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.5626434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:57,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66072 samples/s/p 1:41:07 } +2024-07-30 04:28:00,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1959/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 4.559202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:00,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65966 samples/s/p 1:41:05 } +2024-07-30 04:28:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1961/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 4.555761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:03,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66069 samples/s/p 1:41:01 } +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1963/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 4.55232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66086 samples/s/p 1:40:58 } +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1965/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 4.5488787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66128 samples/s/p 1:40:55 } +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1967/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 4.5454376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66081 samples/s/p 1:40:52 } +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1969/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.5419965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.65987 samples/s/p 1:40:51 } +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1971/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 4.538557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65965 samples/s/p 1:40:48 } +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1973/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 4.535117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66050 samples/s/p 1:40:44 } +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1975/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 4.5316774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65689 samples/s/p 1:40:45 } +2024-07-30 04:28:25,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1977/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 4.5282372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66073 samples/s/p 1:40:38 } +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1979/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.5247984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65570 samples/s/p 1:40:41 } +2024-07-30 04:28:31,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1981/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 4.521359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:31,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66197 samples/s/p 1:40:31 } +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1983/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 4.5179195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66037 samples/s/p 1:40:30 } +2024-07-30 04:28:37,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1985/ 3125], loss: 0.598, per_step_time: 1413ms, lr: 4.5144807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:37,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.65998 samples/s/p 1:40:28 } +2024-07-30 04:28:40,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1987/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.511043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:40,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66146 samples/s/p 1:40:23 } +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1989/ 3125], loss: 0.072, per_step_time: 1412ms, lr: 4.507604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66288 samples/s/p 1:40:19 } +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1991/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 4.504166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66280 samples/s/p 1:40:16 } +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1993/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.5007287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65716 samples/s/p 1:40:19 } +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1995/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.4972912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65948 samples/s/p 1:40:14 } +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1997/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 4.493853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65770 samples/s/p 1:40:13 } +2024-07-30 04:28:57,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1999/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 4.4904164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65782 samples/s/p 1:40:10 } +2024-07-30 04:28:59,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2001/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 4.486979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:59,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65753 samples/s/p 1:40:08 } +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2003/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 4.483543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66033 samples/s/p 1:40:02 } +2024-07-30 04:29:05,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2005/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 4.480107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:05,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66045 samples/s/p 1:39:59 } +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2007/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 4.4766707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65956 samples/s/p 1:39:57 } +2024-07-30 04:29:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2009/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.4732346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:11,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66065 samples/s/p 1:39:53 } +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2011/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 4.4697986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65815 samples/s/p 1:39:53 } +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2013/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 4.466363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65683 samples/s/p 1:39:52 } +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2015/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 4.4629282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66105 samples/s/p 1:39:44 } +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2017/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.4594935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65924 samples/s/p 1:39:43 } +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2019/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.4560597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65970 samples/s/p 1:39:40 } +2024-07-30 04:29:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2021/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 4.4526246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:28,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65436 samples/s/p 1:39:43 } +2024-07-30 04:29:31,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2023/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.449191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:31,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65706 samples/s/p 1:39:37 } +2024-07-30 04:29:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2025/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 4.445756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65501 samples/s/p 1:39:37 } +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2027/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.442323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65924 samples/s/p 1:39:29 } +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2029/ 3125], loss: 0.114, per_step_time: 1425ms, lr: 4.4388903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:39,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.61367 samples/s/p 1:40:15 } +2024-07-30 04:29:42,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2031/ 3125], loss: 0.126, per_step_time: 1415ms, lr: 4.435457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:42,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65213 samples/s/p 1:39:31 } +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2033/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 4.432024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66278 samples/s/p 1:39:17 } +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2035/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.428592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66095 samples/s/p 1:39:16 } +2024-07-30 04:29:50,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2037/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.42516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:50,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66018 samples/s/p 1:39:14 } +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2039/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 4.4217286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66067 samples/s/p 1:39:11 } +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2041/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.4182957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66144 samples/s/p 1:39:07 } +2024-07-30 04:29:59,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2043/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 4.414865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.65832 samples/s/p 1:39:08 } +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2045/ 3125], loss: 0.360, per_step_time: 1412ms, lr: 4.4114336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66193 samples/s/p 1:39:01 } +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2047/ 3125], loss: 0.136, per_step_time: 1442ms, lr: 4.408003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.54543 samples/s/p 1:41:03 } +2024-07-30 04:30:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2049/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.404573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66011 samples/s/p 1:38:57 } +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2051/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.4011426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66008 samples/s/p 1:38:54 } +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2053/ 3125], loss: 0.081, per_step_time: 1413ms, lr: 4.3977125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:13,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66076 samples/s/p 1:38:51 } +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2055/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.3942828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.66025 samples/s/p 1:38:49 } +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2057/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.390853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65978 samples/s/p 1:38:46 } +2024-07-30 04:30:22,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2059/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 4.387424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65950 samples/s/p 1:38:44 } +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2061/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 4.3839955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65902 samples/s/p 1:38:41 } +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2063/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 4.380567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65699 samples/s/p 1:38:41 } +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2065/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 4.377139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65961 samples/s/p 1:38:35 } +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2067/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 4.3737114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65874 samples/s/p 1:38:33 } +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2069/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 4.3702826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66213 samples/s/p 1:38:27 } +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2071/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.3668556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66053 samples/s/p 1:38:26 } +2024-07-30 04:30:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2073/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 4.3634286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65851 samples/s/p 1:38:25 } +2024-07-30 04:30:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2075/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 4.3600025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.66004 samples/s/p 1:38:21 } +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2077/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.3565756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65268 samples/s/p 1:38:25 } +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2079/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 4.35315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65469 samples/s/p 1:38:20 } +2024-07-30 04:30:53,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2081/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 4.3497243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:53,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65647 samples/s/p 1:38:16 } +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2083/ 3125], loss: 0.231, per_step_time: 1416ms, lr: 4.346298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.64615 samples/s/p 1:38:24 } +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2085/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 4.342873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.65939 samples/s/p 1:38:07 } +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2087/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.339449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66106 samples/s/p 1:38:02 } +2024-07-30 04:31:04,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2089/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 4.3360237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:04,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66231 samples/s/p 1:37:58 } +2024-07-30 04:31:07,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2091/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 4.3326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66090 samples/s/p 1:37:57 } +2024-07-30 04:31:10,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2093/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 4.329176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:10,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66121 samples/s/p 1:37:54 } +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2095/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 4.3257533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66207 samples/s/p 1:37:50 } +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2097/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 4.3223286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66204 samples/s/p 1:37:47 } +2024-07-30 04:31:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2099/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.318906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:18,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.65961 samples/s/p 1:37:47 } +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2101/ 3125], loss: 0.409, per_step_time: 1412ms, lr: 4.3154832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66253 samples/s/p 1:37:41 } +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2103/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 4.3120613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66009 samples/s/p 1:37:41 } +2024-07-30 04:31:27,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2105/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.3086397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66030 samples/s/p 1:37:38 } +2024-07-30 04:31:30,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2107/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.305218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:30,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65961 samples/s/p 1:37:36 } +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2109/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.3017967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65967 samples/s/p 1:37:33 } +2024-07-30 04:31:35,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2111/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 4.298376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:35,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66019 samples/s/p 1:37:29 } +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2113/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 4.2949546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65860 samples/s/p 1:37:28 } +2024-07-30 04:31:41,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2115/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 4.2915344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66068 samples/s/p 1:37:23 } +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2117/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.2881147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65890 samples/s/p 1:37:22 } +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2119/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 4.2846955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65867 samples/s/p 1:37:20 } +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2121/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 4.281276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.66108 samples/s/p 1:37:14 } +2024-07-30 04:31:52,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2123/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 4.2778574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:52,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.65914 samples/s/p 1:37:14 } +2024-07-30 04:31:55,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2125/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 4.274439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:55,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65516 samples/s/p 1:37:15 } +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2127/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.27102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:58,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65989 samples/s/p 1:37:07 } +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2129/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.2676024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.66016 samples/s/p 1:37:04 } +2024-07-30 04:32:04,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2131/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 4.264185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66031 samples/s/p 1:37:01 } +2024-07-30 04:32:07,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2133/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 4.2607676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:07,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65957 samples/s/p 1:36:59 } +2024-07-30 04:32:09,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2135/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 4.257351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66075 samples/s/p 1:36:55 } +2024-07-30 04:32:12,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2137/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 4.253935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:12,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65784 samples/s/p 1:36:55 } +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2139/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 4.250519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65182 samples/s/p 1:36:59 } +2024-07-30 04:32:18,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2141/ 3125], loss: 0.498, per_step_time: 1413ms, lr: 4.2471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:18,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.66110 samples/s/p 1:36:46 } +2024-07-30 04:32:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2143/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 4.2436873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65667 samples/s/p 1:36:48 } +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2145/ 3125], loss: 0.457, per_step_time: 1414ms, lr: 4.240272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65648 samples/s/p 1:36:45 } +2024-07-30 04:32:26,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2147/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.2368574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:26,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65686 samples/s/p 1:36:42 } +2024-07-30 04:32:29,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2149/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.2334436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.66113 samples/s/p 1:36:35 } +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2151/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 4.23003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65486 samples/s/p 1:36:38 } +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2153/ 3125], loss: 0.188, per_step_time: 1414ms, lr: 4.226616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65721 samples/s/p 1:36:33 } +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2155/ 3125], loss: 0.256, per_step_time: 1418ms, lr: 4.2232023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.63817 samples/s/p 1:36:50 } +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2157/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 4.2197894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65533 samples/s/p 1:36:29 } +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2159/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.216377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65929 samples/s/p 1:36:23 } +2024-07-30 04:32:46,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2161/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 4.2129655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:46,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65808 samples/s/p 1:36:21 } +2024-07-30 04:32:49,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2163/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 4.209554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65773 samples/s/p 1:36:18 } +2024-07-30 04:32:52,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2165/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.2061424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:52,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66153 samples/s/p 1:36:12 } +2024-07-30 04:32:55,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2167/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 4.2027314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65504 samples/s/p 1:36:16 } +2024-07-30 04:32:58,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2169/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 4.19932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66089 samples/s/p 1:36:07 } +2024-07-30 04:33:00,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2171/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 4.19591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:00,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66123 samples/s/p 1:36:04 } +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2173/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 4.1925005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66045 samples/s/p 1:36:02 } +2024-07-30 04:33:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2175/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.1890917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.65793 samples/s/p 1:36:01 } +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2177/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 4.185682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66257 samples/s/p 1:35:54 } +2024-07-30 04:33:12,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2179/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 4.1822736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66161 samples/s/p 1:35:52 } +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2181/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 4.1788658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.65885 samples/s/p 1:35:52 } +2024-07-30 04:33:17,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2183/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.1754583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.65958 samples/s/p 1:35:48 } +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2185/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.1720496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66091 samples/s/p 1:35:44 } +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2187/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.168643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:23,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65959 samples/s/p 1:35:43 } +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2189/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.165236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65930 samples/s/p 1:35:40 } +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2191/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.16183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.66011 samples/s/p 1:35:36 } +2024-07-30 04:33:32,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2193/ 3125], loss: 0.481, per_step_time: 1413ms, lr: 4.1584244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65994 samples/s/p 1:35:34 } +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2195/ 3125], loss: 0.492, per_step_time: 1414ms, lr: 4.1550193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:34,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65457 samples/s/p 1:35:36 } +2024-07-30 04:33:37,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2197/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 4.1516146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:37,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65264 samples/s/p 1:35:36 } +2024-07-30 04:33:40,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2199/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 4.148209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:40,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65759 samples/s/p 1:35:28 } +2024-07-30 04:33:43,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2201/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.1448043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:43,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65914 samples/s/p 1:35:23 } +2024-07-30 04:33:46,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2203/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 4.141401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:46,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.66013 samples/s/p 1:35:20 } +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2205/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.1379976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66141 samples/s/p 1:35:15 } +2024-07-30 04:33:51,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2207/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.1345947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:51,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66140 samples/s/p 1:35:13 } +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2209/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 4.131192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66090 samples/s/p 1:35:10 } +2024-07-30 04:33:57,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2211/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 4.12779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66216 samples/s/p 1:35:06 } +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2213/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.1243875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66144 samples/s/p 1:35:04 } +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2215/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 4.1209864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66250 samples/s/p 1:35:00 } +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2217/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 4.117586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66024 samples/s/p 1:35:00 } +2024-07-30 04:34:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2219/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 4.1141857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.65966 samples/s/p 1:34:57 } +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2221/ 3125], loss: 0.216, per_step_time: 1412ms, lr: 4.110785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66216 samples/s/p 1:34:52 } +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2223/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 4.1073854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.65773 samples/s/p 1:34:54 } +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2225/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 4.1039866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65909 samples/s/p 1:34:49 } +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2227/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 4.1005865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65456 samples/s/p 1:34:51 } +2024-07-30 04:34:23,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2229/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 4.0971886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:23,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65897 samples/s/p 1:34:44 } +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2231/ 3125], loss: 0.579, per_step_time: 1413ms, lr: 4.093791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65787 samples/s/p 1:34:42 } +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2233/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 4.0903933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65727 samples/s/p 1:34:40 } +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2235/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.0869963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:31,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66037 samples/s/p 1:34:34 } +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2237/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.0836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65956 samples/s/p 1:34:32 } +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2239/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 4.080204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65402 samples/s/p 1:34:35 } +2024-07-30 04:34:40,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2241/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 4.0768073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66172 samples/s/p 1:34:24 } +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2243/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 4.073412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65856 samples/s/p 1:34:25 } +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2245/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 4.070017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.66014 samples/s/p 1:34:20 } +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2247/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 4.0666228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:48,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65504 samples/s/p 1:34:22 } +2024-07-30 04:34:51,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2249/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.063229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:51,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.66013 samples/s/p 1:34:14 } +2024-07-30 04:34:54,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2251/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 4.0598356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65726 samples/s/p 1:34:15 } +2024-07-30 04:34:57,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2253/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 4.056443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.66098 samples/s/p 1:34:08 } +2024-07-30 04:34:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2255/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 4.0530504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65717 samples/s/p 1:34:09 } +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2257/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 4.049657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65690 samples/s/p 1:34:06 } +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2259/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 4.0462655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.66040 samples/s/p 1:34:00 } +2024-07-30 04:35:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2261/ 3125], loss: 0.310, per_step_time: 1412ms, lr: 4.0428745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66262 samples/s/p 1:33:55 } +2024-07-30 04:35:11,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2263/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.039484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:11,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65900 samples/s/p 1:33:56 } +2024-07-30 04:35:14,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2265/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 4.0360937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:14,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66303 samples/s/p 1:33:49 } +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2267/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 4.0327036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:16,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65795 samples/s/p 1:33:51 } +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2269/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 4.0293144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66041 samples/s/p 1:33:46 } +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2271/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 4.025924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:22,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66254 samples/s/p 1:33:41 } +2024-07-30 04:35:25,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2273/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 4.0225364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:25,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66120 samples/s/p 1:33:40 } +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2275/ 3125], loss: 0.459, per_step_time: 1413ms, lr: 4.019148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66160 samples/s/p 1:33:36 } +2024-07-30 04:35:31,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2277/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.015761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:31,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66043 samples/s/p 1:33:35 } +2024-07-30 04:35:33,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2279/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 4.0123737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:33,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66010 samples/s/p 1:33:32 } +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2281/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.008987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66253 samples/s/p 1:33:27 } +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2283/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 4.005601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:39,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65940 samples/s/p 1:33:27 } +2024-07-30 04:35:42,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2285/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 4.0022146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:42,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66086 samples/s/p 1:33:23 } +2024-07-30 04:35:45,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2287/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.9988295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:45,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65887 samples/s/p 1:33:22 } +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2289/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.9954452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66028 samples/s/p 1:33:18 } +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2291/ 3125], loss: 0.377, per_step_time: 1412ms, lr: 3.9920606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.66201 samples/s/p 1:33:13 } +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2293/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.9886772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65673 samples/s/p 1:33:16 } +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2295/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.985294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65972 samples/s/p 1:33:10 } +2024-07-30 04:35:59,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2297/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 3.9819115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:59,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65623 samples/s/p 1:33:10 } +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2299/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 3.978528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65781 samples/s/p 1:33:06 } +2024-07-30 04:36:05,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2301/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.9751467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:05,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65856 samples/s/p 1:33:03 } +2024-07-30 04:36:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2303/ 3125], loss: 0.450, per_step_time: 1414ms, lr: 3.9717647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65462 samples/s/p 1:33:04 } +2024-07-30 04:36:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2305/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 3.9683846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:10,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65774 samples/s/p 1:32:58 } +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2307/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.9650045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.66001 samples/s/p 1:32:53 } +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2309/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 3.9616248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66140 samples/s/p 1:32:48 } +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2311/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 3.958245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.65987 samples/s/p 1:32:47 } +2024-07-30 04:36:22,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2313/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 3.9548663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:22,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.65996 samples/s/p 1:32:44 } +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2315/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 3.951487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66244 samples/s/p 1:32:39 } +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2317/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.9481097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66024 samples/s/p 1:32:38 } +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2319/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.9447323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.65986 samples/s/p 1:32:36 } +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2321/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 3.9413558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66120 samples/s/p 1:32:32 } +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2323/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.9379793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.65973 samples/s/p 1:32:30 } +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2325/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 3.9346037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66237 samples/s/p 1:32:25 } +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2327/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.9312285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65931 samples/s/p 1:32:25 } +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2329/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.9278525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66132 samples/s/p 1:32:20 } +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2331/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 3.9244787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66118 samples/s/p 1:32:18 } +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2333/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.921105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65955 samples/s/p 1:32:16 } +2024-07-30 04:36:53,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2335/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 3.9177316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:53,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65865 samples/s/p 1:32:14 } +2024-07-30 04:36:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2337/ 3125], loss: 0.206, per_step_time: 1417ms, lr: 3.914359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.64249 samples/s/p 1:32:27 } +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2339/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 3.910987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65843 samples/s/p 1:32:09 } +2024-07-30 04:37:01,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2341/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.9076153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65877 samples/s/p 1:32:06 } +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2343/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.9042434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65591 samples/s/p 1:32:06 } +2024-07-30 04:37:07,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2345/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 3.900873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:07,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65994 samples/s/p 1:31:59 } +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2347/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 3.897502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65658 samples/s/p 1:31:59 } +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2349/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 3.894133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.66187 samples/s/p 1:31:51 } +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2351/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 3.890764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65793 samples/s/p 1:31:52 } +2024-07-30 04:37:18,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2353/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.887396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65984 samples/s/p 1:31:48 } +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2355/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 3.8840276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66245 samples/s/p 1:31:42 } +2024-07-30 04:37:24,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2357/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 3.8806597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:24,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65487 samples/s/p 1:31:47 } +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2359/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 3.8772923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65973 samples/s/p 1:31:39 } +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2361/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 3.873926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65867 samples/s/p 1:31:38 } +2024-07-30 04:37:32,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2363/ 3125], loss: 0.151, per_step_time: 1415ms, lr: 3.8705602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65186 samples/s/p 1:31:41 } +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2365/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.867195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65849 samples/s/p 1:31:32 } +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2367/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.86383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65872 samples/s/p 1:31:29 } +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2369/ 3125], loss: 0.330, per_step_time: 1415ms, lr: 3.8604658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65185 samples/s/p 1:31:33 } +2024-07-30 04:37:44,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2371/ 3125], loss: 0.040, per_step_time: 1414ms, lr: 3.8571015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:44,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65574 samples/s/p 1:31:26 } +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2373/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.8537382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.66160 samples/s/p 1:31:18 } +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2375/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.850376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.65814 samples/s/p 1:31:18 } +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2377/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.8470143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66079 samples/s/p 1:31:13 } +2024-07-30 04:37:55,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2379/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.8436524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:55,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66031 samples/s/p 1:31:11 } +2024-07-30 04:37:58,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2381/ 3125], loss: 0.364, per_step_time: 1416ms, lr: 3.8402914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.64732 samples/s/p 1:31:20 } +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2383/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.8369312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65806 samples/s/p 1:31:07 } +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2385/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 3.8335716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65953 samples/s/p 1:31:03 } +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2387/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 3.8302114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65944 samples/s/p 1:31:00 } +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2389/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.826853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66113 samples/s/p 1:30:56 } +2024-07-30 04:38:12,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2391/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.8234944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:12,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66062 samples/s/p 1:30:53 } +2024-07-30 04:38:15,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2393/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 3.820137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:15,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65689 samples/s/p 1:30:54 } +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2395/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 3.81678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65926 samples/s/p 1:30:49 } +2024-07-30 04:38:21,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2397/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 3.8134237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:21,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66067 samples/s/p 1:30:45 } +2024-07-30 04:38:24,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2399/ 3125], loss: 0.156, per_step_time: 1415ms, lr: 3.8100677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65300 samples/s/p 1:30:49 } +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2401/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.806712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65888 samples/s/p 1:30:41 } +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2403/ 3125], loss: 0.595, per_step_time: 1413ms, lr: 3.8033568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65903 samples/s/p 1:30:38 } +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2405/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 3.8000028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65900 samples/s/p 1:30:35 } +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2407/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 3.7966493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65575 samples/s/p 1:30:35 } +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2409/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7932964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65716 samples/s/p 1:30:31 } +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2411/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.7899433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66010 samples/s/p 1:30:26 } +2024-07-30 04:38:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2413/ 3125], loss: 0.084, per_step_time: 1413ms, lr: 3.7865918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66052 samples/s/p 1:30:22 } +2024-07-30 04:38:46,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2415/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.7832397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:46,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66114 samples/s/p 1:30:19 } +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2417/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 3.7798889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66017 samples/s/p 1:30:17 } +2024-07-30 04:38:52,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2419/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.7765392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:52,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65894 samples/s/p 1:30:15 } +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2421/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7731897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66062 samples/s/p 1:30:11 } +2024-07-30 04:38:58,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2423/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 3.7698403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:58,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65804 samples/s/p 1:30:11 } +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2425/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.7664922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66020 samples/s/p 1:30:06 } +2024-07-30 04:39:03,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2427/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.7631446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:03,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65884 samples/s/p 1:30:04 } +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2429/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.7597963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:06,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66000 samples/s/p 1:30:00 } +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2431/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.7564498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.66088 samples/s/p 1:29:57 } +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2433/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 3.753104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65524 samples/s/p 1:29:59 } +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2435/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7497582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65918 samples/s/p 1:29:53 } +2024-07-30 04:39:17,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2437/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.7464135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:17,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65995 samples/s/p 1:29:49 } +2024-07-30 04:39:20,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2439/ 3125], loss: 0.328, per_step_time: 1415ms, lr: 3.7430698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:20,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65107 samples/s/p 1:29:55 } +2024-07-30 04:39:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2441/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.7397258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65852 samples/s/p 1:29:45 } +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2443/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.736382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.66038 samples/s/p 1:29:40 } +2024-07-30 04:39:29,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2445/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.73304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:29,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65663 samples/s/p 1:29:41 } +2024-07-30 04:39:32,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2447/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.7296977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:32,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65110 samples/s/p 1:29:43 } +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2449/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 3.7263565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65840 samples/s/p 1:29:33 } +2024-07-30 04:39:37,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2451/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 3.7230163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65964 samples/s/p 1:29:29 } +2024-07-30 04:39:40,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2453/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 3.7196764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65759 samples/s/p 1:29:29 } +2024-07-30 04:39:43,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2455/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 3.7163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:43,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65910 samples/s/p 1:29:24 } +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2457/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 3.712998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66056 samples/s/p 1:29:20 } +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2459/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 3.7096588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66118 samples/s/p 1:29:17 } +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2461/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.7063216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66090 samples/s/p 1:29:14 } +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2463/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 3.7029847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65974 samples/s/p 1:29:12 } +2024-07-30 04:39:57,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2465/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.6996487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:57,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66012 samples/s/p 1:29:09 } +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2467/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.6963124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.65918 samples/s/p 1:29:07 } +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2469/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.6929775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.65938 samples/s/p 1:29:04 } +2024-07-30 04:40:06,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2471/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 3.6896433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:06,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66141 samples/s/p 1:29:00 } +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2473/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.6863087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.65831 samples/s/p 1:29:00 } +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2475/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.6829756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66116 samples/s/p 1:28:54 } +2024-07-30 04:40:11,714 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2477/ 3125], loss: 0.064, per_step_time: 1695ms, lr: 3.6796432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:46,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 4.71857 samples/s/p 1:46:36 } +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2479/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.676311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65853 samples/s/p 1:28:51 } +2024-07-30 04:40:51,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2481/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 3.67298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:51,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66207 samples/s/p 1:28:45 } +2024-07-30 04:40:54,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2483/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 3.6696492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:54,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65970 samples/s/p 1:28:44 } +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2485/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6663198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65013 samples/s/p 1:28:50 } +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2487/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.662989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65881 samples/s/p 1:28:39 } +2024-07-30 04:41:03,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2489/ 3125], loss: 0.297, per_step_time: 1416ms, lr: 3.6596607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:03,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.64938 samples/s/p 1:28:45 } +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2491/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 3.6563322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.66134 samples/s/p 1:28:31 } +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2493/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 3.6530046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65908 samples/s/p 1:28:31 } +2024-07-30 04:41:11,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2495/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 3.649678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:11,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65696 samples/s/p 1:28:30 } +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2497/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 3.6463523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65834 samples/s/p 1:28:26 } +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2499/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 3.6430263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65765 samples/s/p 1:28:23 } +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2501/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.639701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65991 samples/s/p 1:28:19 } +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2503/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.6363765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65877 samples/s/p 1:28:17 } +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2505/ 3125], loss: 0.574, per_step_time: 1424ms, lr: 3.633053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.61458 samples/s/p 1:28:56 } +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2507/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6297301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65199 samples/s/p 1:28:17 } +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2509/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.6264082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65693 samples/s/p 1:28:10 } +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2511/ 3125], loss: 0.570, per_step_time: 1415ms, lr: 3.623086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65364 samples/s/p 1:28:10 } +2024-07-30 04:41:37,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2513/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 3.6197655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:37,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.66187 samples/s/p 1:28:00 } +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2515/ 3125], loss: 0.619, per_step_time: 1413ms, lr: 3.616444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65846 samples/s/p 1:28:00 } +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2517/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 3.6131246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65553 samples/s/p 1:28:00 } +2024-07-30 04:41:45,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2519/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 3.6098056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65510 samples/s/p 1:27:58 } +2024-07-30 04:41:48,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2521/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 3.6064878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:48,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.66072 samples/s/p 1:27:49 } +2024-07-30 04:41:51,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2523/ 3125], loss: 0.164, per_step_time: 1429ms, lr: 3.6031697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:51,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.59603 samples/s/p 1:28:48 } +2024-07-30 04:41:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2525/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.5998528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66111 samples/s/p 1:27:43 } +2024-07-30 04:41:57,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2527/ 3125], loss: 0.453, per_step_time: 1414ms, lr: 3.5965368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:57,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65498 samples/s/p 1:27:46 } +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2529/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.5932212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65871 samples/s/p 1:27:40 } +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2531/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 3.5899054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65916 samples/s/p 1:27:37 } +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2533/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 3.5865914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65711 samples/s/p 1:27:36 } +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2535/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.5832775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65908 samples/s/p 1:27:31 } +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2537/ 3125], loss: 0.054, per_step_time: 1414ms, lr: 3.5799646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65753 samples/s/p 1:27:30 } +2024-07-30 04:42:14,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2539/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.5766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:14,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65832 samples/s/p 1:27:26 } +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2541/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.573341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.66111 samples/s/p 1:27:21 } +2024-07-30 04:42:19,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2543/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 3.5700302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:19,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65682 samples/s/p 1:27:22 } +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2545/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 3.5667192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.66155 samples/s/p 1:27:15 } +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2547/ 3125], loss: 0.118, per_step_time: 1415ms, lr: 3.563409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65316 samples/s/p 1:27:20 } +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2549/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 3.5601004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65712 samples/s/p 1:27:13 } +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2551/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 3.5567923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.66185 samples/s/p 1:27:06 } +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2553/ 3125], loss: 0.078, per_step_time: 1414ms, lr: 3.5534852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65503 samples/s/p 1:27:10 } +2024-07-30 04:42:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2555/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 3.5501782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65460 samples/s/p 1:27:07 } +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2557/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.546872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65963 samples/s/p 1:27:00 } +2024-07-30 04:42:42,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2559/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 3.5435658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:42,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.66056 samples/s/p 1:26:56 } +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2561/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 3.5402613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66137 samples/s/p 1:26:52 } +2024-07-30 04:42:48,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2563/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.5369574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:48,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66002 samples/s/p 1:26:51 } +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2565/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.533654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66142 samples/s/p 1:26:47 } +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2567/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 3.5303517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65929 samples/s/p 1:26:46 } +2024-07-30 04:42:56,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2569/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 3.5270493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66022 samples/s/p 1:26:42 } +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2571/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 3.5237483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66026 samples/s/p 1:26:39 } +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2573/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.5204469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65893 samples/s/p 1:26:38 } +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2575/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 3.5171472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65530 samples/s/p 1:26:38 } +2024-07-30 04:43:08,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2577/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 3.5138485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66020 samples/s/p 1:26:31 } +2024-07-30 04:43:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2579/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.5105502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65673 samples/s/p 1:26:31 } +2024-07-30 04:43:13,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2581/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 3.5072524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:13,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.66000 samples/s/p 1:26:25 } +2024-07-30 04:43:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2583/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 3.5039554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65920 samples/s/p 1:26:23 } +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2585/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5006594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65873 samples/s/p 1:26:21 } +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2587/ 3125], loss: 0.173, per_step_time: 1415ms, lr: 3.4973639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65258 samples/s/p 1:26:24 } +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2589/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4940683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65954 samples/s/p 1:26:14 } +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2591/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 3.4907746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.66098 samples/s/p 1:26:10 } +2024-07-30 04:43:30,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2593/ 3125], loss: 0.070, per_step_time: 1414ms, lr: 3.4874804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65429 samples/s/p 1:26:14 } +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2595/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 3.4841883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65684 samples/s/p 1:26:08 } +2024-07-30 04:43:36,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2597/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 3.4808963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:36,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65667 samples/s/p 1:26:06 } +2024-07-30 04:43:39,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2599/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 3.4776056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65442 samples/s/p 1:26:05 } +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2601/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4743143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65996 samples/s/p 1:25:57 } +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2603/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 3.4710242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65938 samples/s/p 1:25:55 } +2024-07-30 04:43:47,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2605/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.467735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65978 samples/s/p 1:25:52 } +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2607/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.4644468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65864 samples/s/p 1:25:50 } +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2609/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 3.4611594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65757 samples/s/p 1:25:48 } +2024-07-30 04:43:56,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2611/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4578727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:56,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65982 samples/s/p 1:25:43 } +2024-07-30 04:43:59,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2613/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.4545865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66043 samples/s/p 1:25:40 } +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2615/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.4513014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66076 samples/s/p 1:25:37 } +2024-07-30 04:44:04,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2617/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 3.4480156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:04,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65848 samples/s/p 1:25:36 } +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2619/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 3.444732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65722 samples/s/p 1:25:34 } +2024-07-30 04:44:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2621/ 3125], loss: 0.879, per_step_time: 1413ms, lr: 3.4414493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65829 samples/s/p 1:25:30 } +2024-07-30 04:44:13,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2623/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 3.438167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:13,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65123 samples/s/p 1:25:34 } +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2625/ 3125], loss: 0.056, per_step_time: 1418ms, lr: 3.434885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.63998 samples/s/p 1:25:41 } +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2627/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.4316042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65993 samples/s/p 1:25:20 } +2024-07-30 04:44:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2629/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 3.4283244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66196 samples/s/p 1:25:16 } +2024-07-30 04:44:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2631/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 3.4250438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:24,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66175 samples/s/p 1:25:13 } +2024-07-30 04:44:27,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2633/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 3.4217655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:27,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65100 samples/s/p 1:25:20 } +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2635/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.4184877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66240 samples/s/p 1:25:07 } +2024-07-30 04:44:33,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2637/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 3.4152101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65765 samples/s/p 1:25:08 } +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2639/ 3125], loss: 0.533, per_step_time: 1413ms, lr: 3.4119344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65893 samples/s/p 1:25:04 } +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2641/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 3.4086588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65324 samples/s/p 1:25:07 } +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2643/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 3.405384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65921 samples/s/p 1:24:58 } +2024-07-30 04:44:44,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2645/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 3.402109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:44,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66336 samples/s/p 1:24:52 } +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2647/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 3.3988356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65804 samples/s/p 1:24:54 } +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2649/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3955628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65982 samples/s/p 1:24:49 } +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2651/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 3.3922913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65959 samples/s/p 1:24:47 } +2024-07-30 04:44:55,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2653/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.3890205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65957 samples/s/p 1:24:44 } +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2655/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 3.3857502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65586 samples/s/p 1:24:44 } +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2657/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 3.3824806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65766 samples/s/p 1:24:40 } +2024-07-30 04:45:04,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2659/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.3792119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:04,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65955 samples/s/p 1:24:36 } +2024-07-30 04:45:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2661/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.3759432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65951 samples/s/p 1:24:33 } +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2663/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.3726762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65914 samples/s/p 1:24:30 } +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2665/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 3.36941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65954 samples/s/p 1:24:27 } +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2667/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.3661445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66034 samples/s/p 1:24:24 } +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2669/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 3.3628792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65768 samples/s/p 1:24:23 } +2024-07-30 04:45:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2671/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 3.3596154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66041 samples/s/p 1:24:18 } +2024-07-30 04:45:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2673/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 3.3563524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66101 samples/s/p 1:24:14 } +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2675/ 3125], loss: 0.167, per_step_time: 1412ms, lr: 3.353089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66177 samples/s/p 1:24:11 } +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2677/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.3498275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65844 samples/s/p 1:24:11 } +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2679/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.3465665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65825 samples/s/p 1:24:08 } +2024-07-30 04:45:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2681/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 3.3433062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66069 samples/s/p 1:24:03 } +2024-07-30 04:45:38,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2683/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 3.340047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65865 samples/s/p 1:24:02 } +2024-07-30 04:45:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2685/ 3125], loss: 0.134, per_step_time: 1414ms, lr: 3.3367887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65388 samples/s/p 1:24:04 } +2024-07-30 04:45:43,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2687/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.333531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:43,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.66143 samples/s/p 1:23:54 } +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2689/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 3.3302733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.65938 samples/s/p 1:23:53 } +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2691/ 3125], loss: 0.316, per_step_time: 1412ms, lr: 3.3270173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66174 samples/s/p 1:23:48 } +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2693/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3237618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65951 samples/s/p 1:23:47 } +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2695/ 3125], loss: 0.215, per_step_time: 1416ms, lr: 3.3205074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.64663 samples/s/p 1:23:56 } +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2697/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.3172535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65945 samples/s/p 1:23:42 } +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2699/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 3.3140009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65960 samples/s/p 1:23:39 } +2024-07-30 04:46:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2701/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.3107483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65950 samples/s/p 1:23:36 } +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2703/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 3.3074969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65695 samples/s/p 1:23:36 } +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2705/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 3.3042456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:09,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65984 samples/s/p 1:23:30 } +2024-07-30 04:46:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2707/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 3.3009962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:12,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.66021 samples/s/p 1:23:27 } +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2709/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 3.2977473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65394 samples/s/p 1:23:30 } +2024-07-30 04:46:17,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2711/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 3.2944995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:17,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65507 samples/s/p 1:23:26 } +2024-07-30 04:46:20,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2713/ 3125], loss: 0.175, per_step_time: 1415ms, lr: 3.291252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:20,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65052 samples/s/p 1:23:27 } +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2715/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2880055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66005 samples/s/p 1:23:16 } +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2717/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 3.2847588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66150 samples/s/p 1:23:12 } +2024-07-30 04:46:29,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2719/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.2815146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66002 samples/s/p 1:23:10 } +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2721/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 3.2782705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66085 samples/s/p 1:23:07 } +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2723/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 3.275028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65964 samples/s/p 1:23:05 } +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2725/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 3.2717846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66022 samples/s/p 1:23:02 } +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2727/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 3.2685434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66052 samples/s/p 1:22:59 } +2024-07-30 04:46:43,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2729/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 3.265303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:43,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65887 samples/s/p 1:22:57 } +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2731/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2620633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.66042 samples/s/p 1:22:53 } +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2733/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 3.2588234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65934 samples/s/p 1:22:51 } +2024-07-30 04:46:52,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2735/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 3.2555854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:52,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65759 samples/s/p 1:22:50 } +2024-07-30 04:46:54,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2737/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 3.2523476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65715 samples/s/p 1:22:47 } +2024-07-30 04:46:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2739/ 3125], loss: 0.217, per_step_time: 1428ms, lr: 3.2491112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:57,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.60044 samples/s/p 1:23:35 } +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2741/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.2458759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66018 samples/s/p 1:22:39 } +2024-07-30 04:47:03,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2743/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 3.242641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:03,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65803 samples/s/p 1:22:38 } +2024-07-30 04:47:06,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2745/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 3.2394066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66122 samples/s/p 1:22:32 } +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2747/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.236173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65964 samples/s/p 1:22:31 } +2024-07-30 04:47:11,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2749/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 3.2329403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66082 samples/s/p 1:22:27 } +2024-07-30 04:47:14,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2751/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.2297091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66087 samples/s/p 1:22:24 } +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2753/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 3.2264786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65869 samples/s/p 1:22:23 } +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2755/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 3.2232485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65860 samples/s/p 1:22:21 } +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2757/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 3.2200196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66003 samples/s/p 1:22:17 } +2024-07-30 04:47:26,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2759/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.2167916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65919 samples/s/p 1:22:14 } +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2761/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 3.2135636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65652 samples/s/p 1:22:14 } +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2763/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.2103371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65890 samples/s/p 1:22:09 } +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2765/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.2071118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65903 samples/s/p 1:22:06 } +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2767/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 3.2038872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65859 samples/s/p 1:22:04 } +2024-07-30 04:47:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2769/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.200663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.66068 samples/s/p 1:21:59 } +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2771/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 3.1974405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65887 samples/s/p 1:21:58 } +2024-07-30 04:47:45,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2773/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 3.1942182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65803 samples/s/p 1:21:56 } +2024-07-30 04:47:48,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2775/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 3.190996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65687 samples/s/p 1:21:54 } +2024-07-30 04:47:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2777/ 3125], loss: 0.291, per_step_time: 1415ms, lr: 3.1877757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:51,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65143 samples/s/p 1:21:56 } +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2779/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 3.1845566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66096 samples/s/p 1:21:45 } +2024-07-30 04:47:57,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2781/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 3.1813377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:57,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66000 samples/s/p 1:21:43 } +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2783/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.1781199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66149 samples/s/p 1:21:39 } +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2785/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 3.1749032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65963 samples/s/p 1:21:37 } +2024-07-30 04:48:05,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2787/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.171687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:05,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66102 samples/s/p 1:21:33 } +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2789/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1684717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66069 samples/s/p 1:21:31 } +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2791/ 3125], loss: 0.480, per_step_time: 1412ms, lr: 3.1652569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66188 samples/s/p 1:21:27 } +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2793/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.162043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65988 samples/s/p 1:21:26 } +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2795/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 3.1588309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65838 samples/s/p 1:21:24 } +2024-07-30 04:48:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2797/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.1556194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:19,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66062 samples/s/p 1:21:20 } +2024-07-30 04:48:22,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2799/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.152409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65956 samples/s/p 1:21:18 } +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2801/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.1491986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66045 samples/s/p 1:21:14 } +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2803/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 3.1459897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65546 samples/s/p 1:21:15 } +2024-07-30 04:48:31,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2805/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 3.1427805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66166 samples/s/p 1:21:07 } +2024-07-30 04:48:34,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2807/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 3.1395732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65738 samples/s/p 1:21:08 } +2024-07-30 04:48:36,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2809/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.136367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:36,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65546 samples/s/p 1:21:07 } +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2811/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.133162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65983 samples/s/p 1:21:00 } +2024-07-30 04:48:42,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2813/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.1299573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:42,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65859 samples/s/p 1:20:59 } +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2815/ 3125], loss: 0.597, per_step_time: 1414ms, lr: 3.1267534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65758 samples/s/p 1:20:57 } +2024-07-30 04:48:48,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2817/ 3125], loss: 0.322, per_step_time: 1415ms, lr: 3.1235509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:48,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65258 samples/s/p 1:20:58 } +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2819/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 3.1203479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65747 samples/s/p 1:20:51 } +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2821/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.1171471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.66146 samples/s/p 1:20:45 } +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2823/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1139475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65896 samples/s/p 1:20:44 } +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2825/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 3.110748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66171 samples/s/p 1:20:39 } +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2827/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 3.1075494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66044 samples/s/p 1:20:37 } +2024-07-30 04:49:05,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2829/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 3.1043523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66030 samples/s/p 1:20:35 } +2024-07-30 04:49:08,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2831/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 3.1011564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.65900 samples/s/p 1:20:33 } +2024-07-30 04:49:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2833/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.0979597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.65890 samples/s/p 1:20:30 } +2024-07-30 04:49:13,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2835/ 3125], loss: 0.214, per_step_time: 1418ms, lr: 3.094765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.63919 samples/s/p 1:20:44 } +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2837/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0915708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66163 samples/s/p 1:20:22 } +2024-07-30 04:49:19,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2839/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.0883782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:19,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66054 samples/s/p 1:20:20 } +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2841/ 3125], loss: 0.094, per_step_time: 1412ms, lr: 3.0851863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66198 samples/s/p 1:20:16 } +2024-07-30 04:49:25,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2843/ 3125], loss: 0.482, per_step_time: 1416ms, lr: 3.0819954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:25,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.64820 samples/s/p 1:20:25 } +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2845/ 3125], loss: 0.384, per_step_time: 1415ms, lr: 3.0788058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65083 samples/s/p 1:20:20 } +2024-07-30 04:49:30,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2847/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.0756155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:30,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65799 samples/s/p 1:20:11 } +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2849/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 3.0724268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:33,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65907 samples/s/p 1:20:07 } +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2851/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0692397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65966 samples/s/p 1:20:04 } +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2853/ 3125], loss: 0.544, per_step_time: 1413ms, lr: 3.0660533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.65905 samples/s/p 1:20:02 } +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2855/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 3.062868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66149 samples/s/p 1:19:57 } +2024-07-30 04:49:44,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2857/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 3.0596836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66023 samples/s/p 1:19:55 } +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2859/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.0564995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66073 samples/s/p 1:19:52 } +2024-07-30 04:49:50,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2861/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.053317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:50,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66007 samples/s/p 1:19:50 } +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2863/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.0501344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66040 samples/s/p 1:19:46 } +2024-07-30 04:49:56,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2865/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 3.0469537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:56,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66244 samples/s/p 1:19:42 } +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2867/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.0437736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.65970 samples/s/p 1:19:41 } +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2869/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.040595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:01,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66092 samples/s/p 1:19:38 } +2024-07-30 04:50:04,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2871/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.0374165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:04,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65931 samples/s/p 1:19:36 } +2024-07-30 04:50:07,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2873/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 3.0342396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:07,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65687 samples/s/p 1:19:35 } +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2875/ 3125], loss: 0.374, per_step_time: 1415ms, lr: 3.0310637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65060 samples/s/p 1:19:38 } +2024-07-30 04:50:13,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2877/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.0278873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:13,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65719 samples/s/p 1:19:29 } +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2879/ 3125], loss: 0.043, per_step_time: 1419ms, lr: 3.0247134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.63403 samples/s/p 1:19:46 } +2024-07-30 04:50:18,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2881/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 3.02154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:18,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66038 samples/s/p 1:19:21 } +2024-07-30 04:50:21,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2883/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 3.0183671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:21,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66107 samples/s/p 1:19:18 } +2024-07-30 04:50:24,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2885/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 3.015196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:24,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.65844 samples/s/p 1:19:17 } +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2887/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 3.012026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66064 samples/s/p 1:19:12 } +2024-07-30 04:50:30,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2889/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 3.008856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:30,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66036 samples/s/p 1:19:10 } +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2891/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 3.0056867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66017 samples/s/p 1:19:07 } +2024-07-30 04:50:35,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2893/ 3125], loss: 0.385, per_step_time: 1412ms, lr: 3.0025187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66182 samples/s/p 1:19:03 } +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2895/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.999352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65903 samples/s/p 1:19:02 } +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2897/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 2.9961866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65822 samples/s/p 1:19:00 } +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2899/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 2.9930218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65980 samples/s/p 1:18:56 } +2024-07-30 04:50:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2901/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.9898583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66013 samples/s/p 1:18:53 } +2024-07-30 04:50:50,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2903/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 2.9866949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:50,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65705 samples/s/p 1:18:53 } +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2905/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 2.9835319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66030 samples/s/p 1:18:47 } +2024-07-30 04:50:55,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2907/ 3125], loss: 0.115, per_step_time: 1414ms, lr: 2.980371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65537 samples/s/p 1:18:48 } +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2909/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 2.9772114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65875 samples/s/p 1:18:43 } +2024-07-30 04:51:01,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2911/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.9740524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65920 samples/s/p 1:18:40 } +2024-07-30 04:51:04,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2913/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.9708945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:04,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65788 samples/s/p 1:18:38 } +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2915/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.9677371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66168 samples/s/p 1:18:32 } +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2917/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 2.9645812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65949 samples/s/p 1:18:31 } +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2919/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 2.961425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65297 samples/s/p 1:18:33 } +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2921/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.958271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65760 samples/s/p 1:18:27 } +2024-07-30 04:51:18,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2923/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.9551177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:18,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65928 samples/s/p 1:18:23 } +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2925/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9519658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.66226 samples/s/p 1:18:17 } +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2927/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.9488142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66018 samples/s/p 1:18:16 } +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2929/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9456642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66186 samples/s/p 1:18:12 } +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2931/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 2.942515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65988 samples/s/p 1:18:11 } +2024-07-30 04:51:32,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2933/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 2.9393668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65763 samples/s/p 1:18:10 } +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2935/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 2.9362188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65869 samples/s/p 1:18:06 } +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2937/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 2.9330724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65906 samples/s/p 1:18:03 } +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2939/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 2.9299267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66160 samples/s/p 1:17:58 } +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2941/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 2.9267826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65776 samples/s/p 1:17:58 } +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2943/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.9236394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65904 samples/s/p 1:17:54 } +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2945/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.920497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66126 samples/s/p 1:17:50 } +2024-07-30 04:51:52,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2947/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.917356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65773 samples/s/p 1:17:50 } +2024-07-30 04:51:55,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2949/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 2.9142147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:55,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66097 samples/s/p 1:17:44 } +2024-07-30 04:51:58,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2951/ 3125], loss: 0.022, per_step_time: 1413ms, lr: 2.9110752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:58,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66080 samples/s/p 1:17:42 } +2024-07-30 04:52:00,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2953/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 2.9079372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:00,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65707 samples/s/p 1:17:42 } +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2955/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 2.904799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66220 samples/s/p 1:17:35 } +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2957/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.9016626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66043 samples/s/p 1:17:34 } +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2959/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 2.8985273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.65825 samples/s/p 1:17:33 } +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2961/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.8953932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66126 samples/s/p 1:17:27 } +2024-07-30 04:52:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2963/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.8922586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.65950 samples/s/p 1:17:26 } +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2965/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.8891266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65989 samples/s/p 1:17:23 } +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2967/ 3125], loss: 0.358, per_step_time: 1414ms, lr: 2.8859954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65675 samples/s/p 1:17:22 } +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2969/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.882865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65989 samples/s/p 1:17:17 } +2024-07-30 04:52:26,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2971/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 2.8797358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:26,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65983 samples/s/p 1:17:14 } +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2973/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 2.8766076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65607 samples/s/p 1:17:15 } +2024-07-30 04:52:32,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2975/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 2.8734794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:32,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65687 samples/s/p 1:17:11 } +2024-07-30 04:52:34,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2977/ 3125], loss: 0.048, per_step_time: 1415ms, lr: 2.8703535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65270 samples/s/p 1:17:12 } +2024-07-30 04:52:37,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2979/ 3125], loss: 0.607, per_step_time: 1414ms, lr: 2.867227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:37,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65529 samples/s/p 1:17:07 } +2024-07-30 04:52:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2981/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 2.864103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:40,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65958 samples/s/p 1:17:00 } +2024-07-30 04:52:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2983/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 2.86098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:43,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66084 samples/s/p 1:16:56 } +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2985/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 2.857858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66202 samples/s/p 1:16:53 } +2024-07-30 04:52:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2987/ 3125], loss: 0.051, per_step_time: 1413ms, lr: 2.8547367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:49,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66044 samples/s/p 1:16:51 } +2024-07-30 04:52:52,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2989/ 3125], loss: 0.155, per_step_time: 1444ms, lr: 2.8516167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:52,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.53955 samples/s/p 1:18:29 } +2024-07-30 04:52:54,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2991/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 2.8484965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:54,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66046 samples/s/p 1:16:45 } +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2993/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.8453785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65883 samples/s/p 1:16:44 } +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2995/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 2.8422617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65296 samples/s/p 1:16:46 } +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2997/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.8391455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65894 samples/s/p 1:16:38 } +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2999/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 2.8360298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65846 samples/s/p 1:16:36 } +2024-07-30 04:53:09,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3001/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 2.832916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65412 samples/s/p 1:16:37 } +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3003/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 2.8298032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65783 samples/s/p 1:16:31 } +2024-07-30 04:53:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3005/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.8266911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:14,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65844 samples/s/p 1:16:27 } +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3007/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.8235793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65899 samples/s/p 1:16:24 } +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.8204697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.66126 samples/s/p 1:16:19 } +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3011/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.817361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66084 samples/s/p 1:16:17 } +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3013/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.8142535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65875 samples/s/p 1:16:16 } +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3015/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.811147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66136 samples/s/p 1:16:11 } +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3017/ 3125], loss: 0.380, per_step_time: 1419ms, lr: 2.8080415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.63753 samples/s/p 1:16:27 } +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3019/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 2.8049358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65779 samples/s/p 1:16:08 } +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3021/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 2.8018326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65991 samples/s/p 1:16:04 } +2024-07-30 04:53:40,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3023/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 2.798729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:40,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65796 samples/s/p 1:16:02 } +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3025/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.7956276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.66064 samples/s/p 1:15:57 } +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3027/ 3125], loss: 0.122, per_step_time: 1414ms, lr: 2.7925273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65750 samples/s/p 1:15:57 } +2024-07-30 04:53:48,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3029/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 2.7894282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:48,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65835 samples/s/p 1:15:53 } +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3031/ 3125], loss: 0.483, per_step_time: 1414ms, lr: 2.78633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65501 samples/s/p 1:15:53 } +2024-07-30 04:53:54,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3033/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 2.783233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:54,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65768 samples/s/p 1:15:48 } +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3035/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.7801354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65918 samples/s/p 1:15:44 } +2024-07-30 04:54:00,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3037/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 2.7770404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65218 samples/s/p 1:15:47 } +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3039/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.7739466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.66058 samples/s/p 1:15:38 } +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3041/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.7708536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65884 samples/s/p 1:15:36 } +2024-07-30 04:54:08,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3043/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.7677606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:08,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66029 samples/s/p 1:15:32 } +2024-07-30 04:54:11,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3045/ 3125], loss: 0.135, per_step_time: 1412ms, lr: 2.7646702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:11,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66206 samples/s/p 1:15:28 } +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3047/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 2.7615804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65898 samples/s/p 1:15:28 } +2024-07-30 04:54:17,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3049/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 2.7584906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:17,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66252 samples/s/p 1:15:22 } +2024-07-30 04:54:19,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3051/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 2.755403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:19,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65954 samples/s/p 1:15:21 } +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3053/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.7523165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65987 samples/s/p 1:15:18 } +2024-07-30 04:54:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3055/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.7492315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:25,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65831 samples/s/p 1:15:17 } +2024-07-30 04:54:28,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3057/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 2.746147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65700 samples/s/p 1:15:15 } +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3059/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 2.7430635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.66166 samples/s/p 1:15:08 } +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3061/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 2.7399817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.65770 samples/s/p 1:15:09 } +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3063/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 2.7368992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65547 samples/s/p 1:15:08 } +2024-07-30 04:54:39,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3065/ 3125], loss: 0.355, per_step_time: 1414ms, lr: 2.7338194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:39,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65496 samples/s/p 1:15:05 } +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3067/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.7307394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65803 samples/s/p 1:15:00 } +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3069/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.7276617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66165 samples/s/p 1:14:54 } +2024-07-30 04:54:48,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3071/ 3125], loss: 0.504, per_step_time: 1414ms, lr: 2.7245849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:48,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65766 samples/s/p 1:14:55 } +2024-07-30 04:54:51,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3073/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.7215092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:51,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65941 samples/s/p 1:14:50 } +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3075/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 2.7184346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66162 samples/s/p 1:14:46 } +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3077/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 2.715361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65976 samples/s/p 1:14:44 } +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3079/ 3125], loss: 0.137, per_step_time: 1415ms, lr: 2.7122876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65359 samples/s/p 1:14:47 } +2024-07-30 04:55:02,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3081/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 2.709216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:02,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66038 samples/s/p 1:14:38 } +2024-07-30 04:55:05,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3083/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.7061462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:05,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65919 samples/s/p 1:14:36 } +2024-07-30 04:55:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3085/ 3125], loss: 0.230, per_step_time: 1412ms, lr: 2.7030771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66203 samples/s/p 1:14:31 } +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3087/ 3125], loss: 0.280, per_step_time: 1415ms, lr: 2.7000078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.64995 samples/s/p 1:14:38 } +2024-07-30 04:55:13,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3089/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6969408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:13,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66076 samples/s/p 1:14:27 } +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3091/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.6938749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66029 samples/s/p 1:14:24 } +2024-07-30 04:55:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3093/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.6908092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65747 samples/s/p 1:14:24 } +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3095/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 2.6877456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66177 samples/s/p 1:14:17 } +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3097/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.684683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66013 samples/s/p 1:14:16 } +2024-07-30 04:55:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3099/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.6816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65955 samples/s/p 1:14:14 } +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3101/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 2.678561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66193 samples/s/p 1:14:09 } +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3103/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.6755022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65798 samples/s/p 1:14:09 } +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3105/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 2.672444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66165 samples/s/p 1:14:03 } +2024-07-30 04:55:39,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3107/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 2.6693863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:39,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65735 samples/s/p 1:14:04 } +2024-07-30 04:55:42,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3109/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 2.6663304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:42,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66284 samples/s/p 1:13:57 } +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3111/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.6632742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:44,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66035 samples/s/p 1:13:56 } +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3113/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 2.6602208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65413 samples/s/p 1:13:58 } +2024-07-30 04:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3115/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 2.6571681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65609 samples/s/p 1:13:54 } +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3117/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 2.6541168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65866 samples/s/p 1:13:49 } +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3119/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6510663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65907 samples/s/p 1:13:46 } +2024-07-30 04:55:59,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3121/ 3125], loss: 0.329, per_step_time: 1412ms, lr: 2.648016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:59,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.66224 samples/s/p 1:13:40 } +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3123/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.644968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65822 samples/s/p 1:13:41 } +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3125/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 2.641921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65993 samples/s/p 1:13:37 } +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 2.6388755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65715 samples/s/p 1:13:36 } +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 4/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 2.6358305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65742 samples/s/p 1:13:33 } +2024-07-30 04:56:13,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 6/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.632786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:13,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65802 samples/s/p 1:13:30 } +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 8/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 2.6297437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.66196 samples/s/p 1:13:24 } +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 10/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6267028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65494 samples/s/p 1:13:26 } +2024-07-30 04:56:21,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 12/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6236612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:21,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65647 samples/s/p 1:13:22 } +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 14/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 2.6206224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65415 samples/s/p 1:13:21 } +2024-07-30 04:56:27,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 16/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 2.6175844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65415 samples/s/p 1:13:18 } +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 18/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 2.6145476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66035 samples/s/p 1:13:11 } +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 20/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.6115122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66027 samples/s/p 1:13:08 } +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 22/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.6084776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65916 samples/s/p 1:13:06 } +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 24/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 2.6054445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65982 samples/s/p 1:13:03 } +2024-07-30 04:56:41,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 26/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 2.6024115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65974 samples/s/p 1:13:00 } +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 28/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 2.5993802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66000 samples/s/p 1:12:57 } +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 30/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:47,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66113 samples/s/p 1:12:53 } +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 32/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.5933205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66035 samples/s/p 1:12:51 } +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 34/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.5902932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66150 samples/s/p 1:12:47 } +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 36/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 2.5872669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66138 samples/s/p 1:12:45 } +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 38/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 2.5842417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66029 samples/s/p 1:12:43 } +2024-07-30 04:57:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 40/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 2.581216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:01,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66243 samples/s/p 1:12:38 } +2024-07-30 04:57:04,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 42/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 2.5781935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:04,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65886 samples/s/p 1:12:38 } +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 44/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 2.5751715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66047 samples/s/p 1:12:34 } +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 46/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.5721508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66077 samples/s/p 1:12:31 } +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 48/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.569131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.65721 samples/s/p 1:12:31 } +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 50/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.5661127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66019 samples/s/p 1:12:26 } +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 52/ 3125], loss: 0.283, per_step_time: 1412ms, lr: 2.5630948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66188 samples/s/p 1:12:22 } +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 54/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.5600777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66110 samples/s/p 1:12:19 } +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 56/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 2.557063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65952 samples/s/p 1:12:18 } +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 58/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.5540494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65959 samples/s/p 1:12:15 } +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 60/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 2.5510367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65873 samples/s/p 1:12:13 } +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 62/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.5480251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65958 samples/s/p 1:12:09 } +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 64/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 2.5450151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66195 samples/s/p 1:12:05 } +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 66/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 2.5420063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65765 samples/s/p 1:12:05 } +2024-07-30 04:57:41,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 68/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.5389975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:41,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66164 samples/s/p 1:11:59 } +2024-07-30 04:57:43,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 70/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 2.5359905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66232 samples/s/p 1:11:56 } +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 72/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 2.532985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65629 samples/s/p 1:11:58 } +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 74/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 2.529981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65908 samples/s/p 1:11:53 } +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 76/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 2.5269765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65681 samples/s/p 1:11:51 } +2024-07-30 04:57:55,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 78/ 3125], loss: 0.093, per_step_time: 1414ms, lr: 2.5239747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:55,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65693 samples/s/p 1:11:49 } +2024-07-30 04:57:58,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 80/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.5209742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:58,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.66125 samples/s/p 1:11:42 } +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 82/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 2.5179743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65403 samples/s/p 1:11:45 } +2024-07-30 04:58:03,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 84/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 2.514975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:03,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66264 samples/s/p 1:11:36 } +2024-07-30 04:58:06,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 86/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.5119778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66037 samples/s/p 1:11:35 } +2024-07-30 04:58:09,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 88/ 3125], loss: 0.132, per_step_time: 1414ms, lr: 2.5089817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65522 samples/s/p 1:11:36 } +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 90/ 3125], loss: 0.296, per_step_time: 1415ms, lr: 2.505987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:12,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65367 samples/s/p 1:11:34 } +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 92/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 2.5029933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66166 samples/s/p 1:11:25 } +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 94/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 2.5000008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65800 samples/s/p 1:11:25 } +2024-07-30 04:58:20,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 96/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 2.4970086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65525 samples/s/p 1:11:24 } +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 98/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 2.4940175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66092 samples/s/p 1:11:17 } +2024-07-30 04:58:26,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 100/ 3125], loss: 0.347, per_step_time: 1412ms, lr: 2.4910285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:26,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66212 samples/s/p 1:11:14 } +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 102/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.4880408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66049 samples/s/p 1:11:12 } +2024-07-30 04:58:32,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 104/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 2.4850544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:32,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65578 samples/s/p 1:11:13 } +2024-07-30 04:58:35,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 106/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.4820695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:35,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65915 samples/s/p 1:11:07 } +2024-07-30 04:58:37,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 108/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4790852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:37,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65900 samples/s/p 1:11:05 } +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 110/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4761023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66059 samples/s/p 1:11:01 } +2024-07-30 04:58:43,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 112/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.4731198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:43,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65792 samples/s/p 1:11:00 } +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 114/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.4701392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66001 samples/s/p 1:10:55 } +2024-07-30 04:58:49,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 116/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 2.46716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:49,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66051 samples/s/p 1:10:52 } +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 118/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.464182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66007 samples/s/p 1:10:50 } +2024-07-30 04:58:54,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 120/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 2.461204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:54,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66074 samples/s/p 1:10:46 } +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 122/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 2.4582287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.66003 samples/s/p 1:10:44 } +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 124/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.4552542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:00,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.65854 samples/s/p 1:10:42 } +2024-07-30 04:59:03,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 126/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 2.45228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:03,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.66198 samples/s/p 1:10:37 } +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 128/ 3125], loss: 0.396, per_step_time: 1415ms, lr: 2.4493079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.65230 samples/s/p 1:10:41 } +2024-07-30 04:59:09,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 130/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.4463372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:09,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66066 samples/s/p 1:10:32 } +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 132/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.4433677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65999 samples/s/p 1:10:30 } +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 134/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4403994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65949 samples/s/p 1:10:27 } +2024-07-30 04:59:17,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 136/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 2.4374324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:17,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66012 samples/s/p 1:10:24 } +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 138/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.4344665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65993 samples/s/p 1:10:21 } +2024-07-30 04:59:23,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 140/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 2.431501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:23,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65626 samples/s/p 1:10:21 } +2024-07-30 04:59:26,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 142/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 2.4285375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:26,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66046 samples/s/p 1:10:15 } +2024-07-30 04:59:28,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 144/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.4255744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66118 samples/s/p 1:10:12 } +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 146/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.422613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66035 samples/s/p 1:10:10 } +2024-07-30 04:59:34,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 148/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.4196536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:34,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65445 samples/s/p 1:10:11 } +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 150/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.416695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65803 samples/s/p 1:10:06 } +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 152/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.413738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66114 samples/s/p 1:10:01 } +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 154/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 2.410782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65822 samples/s/p 1:10:00 } +2024-07-30 04:59:45,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 156/ 3125], loss: 0.267, per_step_time: 1419ms, lr: 2.407826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:45,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.63524 samples/s/p 1:10:14 } +2024-07-30 04:59:48,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 158/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.4048725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66163 samples/s/p 1:09:52 } +2024-07-30 04:59:51,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 160/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.4019203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:51,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65998 samples/s/p 1:09:50 } +2024-07-30 04:59:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 162/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3989692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:54,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65905 samples/s/p 1:09:48 } +2024-07-30 04:59:57,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 164/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.396018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66093 samples/s/p 1:09:44 } +2024-07-30 05:00:00,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 166/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 2.3930697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:00,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65760 samples/s/p 1:09:44 } +2024-07-30 05:00:02,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 168/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.3901223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:02,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65796 samples/s/p 1:09:41 } +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 170/ 3125], loss: 0.350, per_step_time: 1417ms, lr: 2.3871753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.64557 samples/s/p 1:09:47 } +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 172/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.3842304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65940 samples/s/p 1:09:34 } +2024-07-30 05:00:11,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 174/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.3812868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:11,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66029 samples/s/p 1:09:30 } +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 176/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.3783446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66003 samples/s/p 1:09:28 } +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 178/ 3125], loss: 0.348, per_step_time: 1414ms, lr: 2.3754033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65689 samples/s/p 1:09:27 } +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 180/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.3724635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65777 samples/s/p 1:09:24 } +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 182/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 2.369525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65694 samples/s/p 1:09:21 } +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 184/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 2.3665866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65573 samples/s/p 1:09:20 } +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 186/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 2.3636508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65723 samples/s/p 1:09:16 } +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 188/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.360715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66112 samples/s/p 1:09:10 } +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 190/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 2.357781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66135 samples/s/p 1:09:07 } +2024-07-30 05:00:36,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 192/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.354849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:36,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66046 samples/s/p 1:09:05 } +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 194/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 2.3519178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65784 samples/s/p 1:09:04 } +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 196/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 2.348988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66105 samples/s/p 1:08:59 } +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 198/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.3460586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:45,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66096 samples/s/p 1:08:56 } +2024-07-30 05:00:48,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 200/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 2.3431312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:48,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66237 samples/s/p 1:08:52 } +2024-07-30 05:00:51,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 202/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 2.3402056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:51,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65841 samples/s/p 1:08:52 } +2024-07-30 05:00:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 204/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 2.3372806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:53,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66055 samples/s/p 1:08:48 } +2024-07-30 05:00:56,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 206/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 2.3343575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:56,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66077 samples/s/p 1:08:45 } +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 208/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.3314344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66081 samples/s/p 1:08:42 } +2024-07-30 05:01:02,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 210/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.3285136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:02,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66147 samples/s/p 1:08:39 } +2024-07-30 05:01:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 212/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 2.3255939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.65799 samples/s/p 1:08:38 } +2024-07-30 05:01:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 214/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 2.3226744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:08,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.65909 samples/s/p 1:08:35 } +2024-07-30 05:01:10,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 216/ 3125], loss: 0.241, per_step_time: 1415ms, lr: 2.3197572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:10,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65243 samples/s/p 1:08:37 } +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 218/ 3125], loss: 0.399, per_step_time: 1416ms, lr: 2.3168413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.64788 samples/s/p 1:08:37 } +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 220/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 2.313927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65911 samples/s/p 1:08:26 } +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 222/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.311014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65912 samples/s/p 1:08:23 } +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 224/ 3125], loss: 0.213, per_step_time: 1412ms, lr: 2.3081018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66179 samples/s/p 1:08:19 } +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 226/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.3051914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.65925 samples/s/p 1:08:18 } +2024-07-30 05:01:27,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 228/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3022812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.65973 samples/s/p 1:08:14 } +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 230/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.2993727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66047 samples/s/p 1:08:11 } +2024-07-30 05:01:33,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 232/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.2964653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:33,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66049 samples/s/p 1:08:08 } +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 234/ 3125], loss: 0.231, per_step_time: 1415ms, lr: 2.2935599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65340 samples/s/p 1:08:10 } +2024-07-30 05:01:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 236/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 2.2906556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:39,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66095 samples/s/p 1:08:02 } +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 238/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.287753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65804 samples/s/p 1:08:01 } +2024-07-30 05:01:44,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 240/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.284851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66122 samples/s/p 1:07:56 } +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 242/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 2.2819497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65425 samples/s/p 1:07:59 } +2024-07-30 05:01:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 244/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 2.279051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65644 samples/s/p 1:07:54 } +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 246/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 2.2761533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66032 samples/s/p 1:07:49 } +2024-07-30 05:01:56,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 248/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 2.2732568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:56,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65648 samples/s/p 1:07:48 } +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 250/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.2703616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65983 samples/s/p 1:07:43 } +2024-07-30 05:02:01,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 252/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 2.2674667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:01,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66032 samples/s/p 1:07:40 } +2024-07-30 05:02:04,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 254/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 2.2645745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:04,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65931 samples/s/p 1:07:38 } +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 256/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.261682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65872 samples/s/p 1:07:36 } +2024-07-30 05:02:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 258/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.2587922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65938 samples/s/p 1:07:32 } +2024-07-30 05:02:13,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 260/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2559038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:13,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66160 samples/s/p 1:07:28 } +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 262/ 3125], loss: 0.442, per_step_time: 1414ms, lr: 2.2530164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65482 samples/s/p 1:07:30 } +2024-07-30 05:02:18,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 264/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.2501304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:18,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65848 samples/s/p 1:07:24 } +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 266/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.247246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66040 samples/s/p 1:07:20 } +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 268/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 2.2443626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65712 samples/s/p 1:07:20 } +2024-07-30 05:02:27,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 270/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.2414795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:27,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65998 samples/s/p 1:07:15 } +2024-07-30 05:02:30,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 272/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 2.2385987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:30,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66009 samples/s/p 1:07:12 } +2024-07-30 05:02:33,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 274/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.2357194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:33,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66043 samples/s/p 1:07:09 } +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 276/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.2328406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66105 samples/s/p 1:07:06 } +2024-07-30 05:02:38,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 278/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 2.2299637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:38,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.65962 samples/s/p 1:07:04 } +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 280/ 3125], loss: 0.103, per_step_time: 1412ms, lr: 2.2270885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66298 samples/s/p 1:06:59 } +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 282/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 2.2242143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.65919 samples/s/p 1:06:58 } +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 284/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 2.2213417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.65986 samples/s/p 1:06:55 } +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 286/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.218469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66026 samples/s/p 1:06:52 } +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 288/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.2155987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66112 samples/s/p 1:06:49 } +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 290/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 2.21273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65385 samples/s/p 1:06:51 } +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 292/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 2.2098627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65547 samples/s/p 1:06:47 } +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 294/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 2.2069967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66101 samples/s/p 1:06:40 } +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 296/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 2.2041309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66263 samples/s/p 1:06:36 } +2024-07-30 05:03:07,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 298/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.2012675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:07,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65975 samples/s/p 1:06:35 } +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 300/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.1984042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66236 samples/s/p 1:06:31 } +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 302/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.1955436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66072 samples/s/p 1:06:29 } +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 304/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.192684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.65827 samples/s/p 1:06:28 } +2024-07-30 05:03:18,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 306/ 3125], loss: 0.305, per_step_time: 1416ms, lr: 2.189826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:18,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.64800 samples/s/p 1:06:32 } +2024-07-30 05:03:21,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 308/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.1869691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:21,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66125 samples/s/p 1:06:20 } +2024-07-30 05:03:24,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 310/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 2.1841138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:24,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66042 samples/s/p 1:06:18 } +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 312/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 2.18126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.65704 samples/s/p 1:06:18 } +2024-07-30 05:03:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 314/ 3125], loss: 0.510, per_step_time: 1414ms, lr: 2.178406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:29,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65610 samples/s/p 1:06:15 } +2024-07-30 05:03:32,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 316/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 2.175555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:32,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65683 samples/s/p 1:06:12 } +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 318/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 2.1727046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66064 samples/s/p 1:06:07 } +2024-07-30 05:03:38,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 320/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 2.1698552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:38,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66230 samples/s/p 1:06:03 } +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 322/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 2.1670078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65562 samples/s/p 1:06:04 } +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 324/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 2.1641617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65993 samples/s/p 1:05:59 } +2024-07-30 05:03:46,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 326/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 2.161317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65770 samples/s/p 1:05:57 } +2024-07-30 05:03:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 328/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 2.158473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:49,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66146 samples/s/p 1:05:52 } +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 330/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 2.1556311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66342 samples/s/p 1:05:48 } +2024-07-30 05:03:55,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 332/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.1527903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:55,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66110 samples/s/p 1:05:46 } +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 334/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.1499513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.65984 samples/s/p 1:05:44 } +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 336/ 3125], loss: 0.485, per_step_time: 1413ms, lr: 2.1471137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66077 samples/s/p 1:05:41 } +2024-07-30 05:04:03,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 338/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 2.144277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65841 samples/s/p 1:05:40 } +2024-07-30 05:04:06,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 340/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 2.141441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:06,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65917 samples/s/p 1:05:36 } +2024-07-30 05:04:09,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 342/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.1386072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:09,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66134 samples/s/p 1:05:32 } +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 344/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.135774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65880 samples/s/p 1:05:31 } +2024-07-30 05:04:15,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 346/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 2.1329429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:15,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65548 samples/s/p 1:05:31 } +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 348/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 2.1301134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65776 samples/s/p 1:05:26 } +2024-07-30 05:04:20,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 350/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.127285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:20,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65796 samples/s/p 1:05:23 } +2024-07-30 05:04:23,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 352/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.1244582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66099 samples/s/p 1:05:18 } +2024-07-30 05:04:26,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 354/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 2.1216326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:26,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65977 samples/s/p 1:05:16 } +2024-07-30 05:04:29,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 356/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 2.1188087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66098 samples/s/p 1:05:13 } +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 358/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 2.115985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66001 samples/s/p 1:05:10 } +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 360/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 2.1131634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65730 samples/s/p 1:05:09 } +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 362/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 2.1103435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65949 samples/s/p 1:05:05 } +2024-07-30 05:04:40,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 364/ 3125], loss: 0.402, per_step_time: 1425ms, lr: 2.1075239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.61076 samples/s/p 1:05:36 } +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 366/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 2.1047065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:43,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66193 samples/s/p 1:04:58 } +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 368/ 3125], loss: 0.405, per_step_time: 1412ms, lr: 2.1018907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66207 samples/s/p 1:04:55 } +2024-07-30 05:04:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 370/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.0990763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66081 samples/s/p 1:04:53 } +2024-07-30 05:04:51,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 372/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 2.0962623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:51,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66167 samples/s/p 1:04:50 } +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 374/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.0934503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66064 samples/s/p 1:04:47 } +2024-07-30 05:04:57,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 376/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 2.09064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66050 samples/s/p 1:04:45 } +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 378/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 2.087831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66104 samples/s/p 1:04:41 } +2024-07-30 05:05:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 380/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 2.0850239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:03,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65827 samples/s/p 1:04:41 } +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 382/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 2.0822176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65932 samples/s/p 1:04:37 } +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 384/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.079413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65985 samples/s/p 1:04:34 } +2024-07-30 05:05:11,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 386/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 2.076608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65780 samples/s/p 1:04:32 } +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 388/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.0738055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65803 samples/s/p 1:04:29 } +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 390/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.0710047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65969 samples/s/p 1:04:25 } +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 392/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 2.0682057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65636 samples/s/p 1:04:25 } +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 394/ 3125], loss: 0.306, per_step_time: 1416ms, lr: 2.065408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.64771 samples/s/p 1:04:28 } +2024-07-30 05:05:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 396/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 2.0626114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65853 samples/s/p 1:04:18 } +2024-07-30 05:05:28,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 398/ 3125], loss: 0.328, per_step_time: 1414ms, lr: 2.0598168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:28,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65700 samples/s/p 1:04:16 } +2024-07-30 05:05:31,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 400/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.0570221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:31,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65992 samples/s/p 1:04:11 } +2024-07-30 05:05:34,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 402/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.05423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:34,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66055 samples/s/p 1:04:08 } +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 404/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 2.051439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66232 samples/s/p 1:04:04 } +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 406/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.0486498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66171 samples/s/p 1:04:01 } +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 408/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 2.0458617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66118 samples/s/p 1:03:59 } +2024-07-30 05:05:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 410/ 3125], loss: 0.260, per_step_time: 1412ms, lr: 2.0430743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:45,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66231 samples/s/p 1:03:55 } +2024-07-30 05:05:48,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 412/ 3125], loss: 0.390, per_step_time: 1415ms, lr: 2.0402892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:48,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65286 samples/s/p 1:03:59 } +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 414/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 2.0375046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65995 samples/s/p 1:03:51 } +2024-07-30 05:05:54,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 416/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 2.0347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66188 samples/s/p 1:03:47 } +2024-07-30 05:05:57,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 418/ 3125], loss: 0.521, per_step_time: 1413ms, lr: 2.0319414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:57,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65870 samples/s/p 1:03:47 } +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 420/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.029162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66036 samples/s/p 1:03:43 } +2024-07-30 05:06:02,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 422/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.0263842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:02,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.66037 samples/s/p 1:03:40 } +2024-07-30 05:06:05,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 424/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.023607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:05,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65881 samples/s/p 1:03:38 } +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 426/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 2.0208322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65866 samples/s/p 1:03:35 } +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 428/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 2.0180582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65865 samples/s/p 1:03:32 } +2024-07-30 05:06:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 430/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 2.0152852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65673 samples/s/p 1:03:31 } +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 432/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 2.0125142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65225 samples/s/p 1:03:31 } +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 434/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.0097436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66067 samples/s/p 1:03:23 } +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 436/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.0069756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66202 samples/s/p 1:03:19 } +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 438/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.0042091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66148 samples/s/p 1:03:16 } +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 440/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 2.0014438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:28,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65637 samples/s/p 1:03:17 } +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 442/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.9986799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65692 samples/s/p 1:03:14 } +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 444/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 1.9959166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65700 samples/s/p 1:03:11 } +2024-07-30 05:06:36,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 446/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 1.9931558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65981 samples/s/p 1:03:06 } +2024-07-30 05:06:39,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 448/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.9903964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:39,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65967 samples/s/p 1:03:03 } +2024-07-30 05:06:42,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 450/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.9876384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:42,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66072 samples/s/p 1:03:00 } +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 452/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 1.9848817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66281 samples/s/p 1:02:56 } +2024-07-30 05:06:48,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 454/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 1.9821257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:48,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.65984 samples/s/p 1:02:55 } +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 456/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.9793717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66082 samples/s/p 1:02:51 } +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 458/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.9766185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65855 samples/s/p 1:02:50 } +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 460/ 3125], loss: 0.338, per_step_time: 1415ms, lr: 1.9738677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65340 samples/s/p 1:02:51 } +2024-07-30 05:06:59,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 462/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.9711183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:59,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65776 samples/s/p 1:02:45 } +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 464/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1.9683703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65887 samples/s/p 1:02:41 } +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 466/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 1.965624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65641 samples/s/p 1:02:40 } +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 468/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.962879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65991 samples/s/p 1:02:35 } +2024-07-30 05:07:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 470/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.9601353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:10,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65843 samples/s/p 1:02:33 } +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 472/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 1.9573924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65801 samples/s/p 1:02:31 } +2024-07-30 05:07:16,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 474/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.9546515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:16,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66040 samples/s/p 1:02:26 } +2024-07-30 05:07:19,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 476/ 3125], loss: 0.248, per_step_time: 1412ms, lr: 1.9519123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:19,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66184 samples/s/p 1:02:22 } +2024-07-30 05:07:22,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 478/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 1.9491736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:22,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66274 samples/s/p 1:02:19 } +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 480/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 1.9464371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66244 samples/s/p 1:02:16 } +2024-07-30 05:07:27,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 482/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 1.9437023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66014 samples/s/p 1:02:15 } +2024-07-30 05:07:30,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 484/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.9409688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.65910 samples/s/p 1:02:13 } +2024-07-30 05:07:33,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 486/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 1.938237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66094 samples/s/p 1:02:09 } +2024-07-30 05:07:36,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 488/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 1.9355055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:36,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66030 samples/s/p 1:02:07 } +2024-07-30 05:07:39,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 490/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.9327765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66086 samples/s/p 1:02:03 } +2024-07-30 05:07:42,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 492/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.930049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66063 samples/s/p 1:02:01 } +2024-07-30 05:07:44,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 494/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 1.9273227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65745 samples/s/p 1:02:00 } +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 496/ 3125], loss: 0.438, per_step_time: 1413ms, lr: 1.924598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.66139 samples/s/p 1:01:54 } +2024-07-30 05:07:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 498/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.9218742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:50,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65829 samples/s/p 1:01:54 } +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 500/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 1.9191523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.66086 samples/s/p 1:01:49 } +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 502/ 3125], loss: 0.083, per_step_time: 1415ms, lr: 1.916431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65241 samples/s/p 1:01:52 } +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 504/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.9137126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65698 samples/s/p 1:01:46 } +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 506/ 3125], loss: 0.513, per_step_time: 1414ms, lr: 1.9109953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65739 samples/s/p 1:01:43 } +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 508/ 3125], loss: 0.122, per_step_time: 1418ms, lr: 1.9082795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.63782 samples/s/p 1:01:53 } +2024-07-30 05:08:07,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 510/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 1.9055652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:07,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65956 samples/s/p 1:01:36 } +2024-07-30 05:08:10,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 512/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9028523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:10,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65971 samples/s/p 1:01:33 } +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 514/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.9001409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66074 samples/s/p 1:01:29 } +2024-07-30 05:08:16,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 516/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.89743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65986 samples/s/p 1:01:27 } +2024-07-30 05:08:18,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 518/ 3125], loss: 0.083, per_step_time: 1414ms, lr: 1.8947217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:18,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65729 samples/s/p 1:01:26 } +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 520/ 3125], loss: 0.139, per_step_time: 1415ms, lr: 1.8920147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65013 samples/s/p 1:01:28 } +2024-07-30 05:08:24,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 522/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 1.8893084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:24,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65617 samples/s/p 1:01:21 } +2024-07-30 05:08:27,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 524/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 1.8866044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:27,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66090 samples/s/p 1:01:15 } +2024-07-30 05:08:30,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 526/ 3125], loss: 0.138, per_step_time: 1414ms, lr: 1.8839019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:30,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65684 samples/s/p 1:01:15 } +2024-07-30 05:08:33,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 528/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 1.8812009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66092 samples/s/p 1:01:10 } +2024-07-30 05:08:35,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 530/ 3125], loss: 0.005, per_step_time: 1412ms, lr: 1.8785005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:35,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66319 samples/s/p 1:01:05 } +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 532/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 1.8758026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65808 samples/s/p 1:01:06 } +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 534/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.873106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66095 samples/s/p 1:01:01 } +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 536/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 1.870411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65938 samples/s/p 1:00:59 } +2024-07-30 05:08:47,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 538/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 1.8677174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:47,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66019 samples/s/p 1:00:56 } +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 540/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 1.8650254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65508 samples/s/p 1:00:56 } +2024-07-30 05:08:52,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 542/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.862334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:52,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65999 samples/s/p 1:00:50 } +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 544/ 3125], loss: 0.156, per_step_time: 1412ms, lr: 1.859645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66180 samples/s/p 1:00:46 } +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 546/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 1.8569565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66120 samples/s/p 1:00:44 } +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 548/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 1.8542704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66107 samples/s/p 1:00:41 } +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 550/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 1.8515858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66111 samples/s/p 1:00:38 } +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 552/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 1.8489027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66096 samples/s/p 1:00:36 } +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 554/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 1.8462214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65978 samples/s/p 1:00:34 } +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 556/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 1.8435412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66082 samples/s/p 1:00:30 } +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 558/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.8408629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65866 samples/s/p 1:00:29 } +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 560/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 1.8381849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65748 samples/s/p 1:00:27 } +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 562/ 3125], loss: 0.268, per_step_time: 1417ms, lr: 1.8355095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.64553 samples/s/p 1:00:31 } +2024-07-30 05:09:24,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 564/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 1.8328357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:24,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65997 samples/s/p 1:00:19 } +2024-07-30 05:09:26,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 566/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.8301621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:26,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66073 samples/s/p 1:00:16 } +2024-07-30 05:09:29,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 568/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 1.8274911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:29,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65993 samples/s/p 1:00:14 } +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 570/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.8248218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65946 samples/s/p 1:00:11 } +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 572/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 1.8221535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65724 samples/s/p 1:00:10 } +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 574/ 3125], loss: 0.064, per_step_time: 1413ms, lr: 1.8194863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65862 samples/s/p 1:00:06 } +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 576/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.8168216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65837 samples/s/p 1:00:03 } +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 578/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 1.8141582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65325 samples/s/p 1:00:04 } +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 580/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.8114963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65953 samples/s/p 0:59:57 } +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 582/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.8088361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65930 samples/s/p 0:59:54 } +2024-07-30 05:09:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 584/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.8061771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66013 samples/s/p 0:59:51 } +2024-07-30 05:09:55,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 586/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 1.8035188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:55,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65534 samples/s/p 0:59:51 } +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 588/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.8008631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66044 samples/s/p 0:59:45 } +2024-07-30 05:10:00,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 590/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.798208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:00,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65147 samples/s/p 0:59:48 } +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 592/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 1.7955554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66002 samples/s/p 0:59:40 } +2024-07-30 05:10:06,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 594/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.7929044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65907 samples/s/p 0:59:37 } +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 596/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.7902544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66162 samples/s/p 0:59:33 } +2024-07-30 05:10:12,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 598/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 1.7876064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66068 samples/s/p 0:59:31 } +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 600/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 1.7849596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65980 samples/s/p 0:59:29 } +2024-07-30 05:10:17,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 602/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 1.7823138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65794 samples/s/p 0:59:27 } +2024-07-30 05:10:20,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 604/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 1.7796704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:20,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65945 samples/s/p 0:59:23 } +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 606/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 1.7770287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65791 samples/s/p 0:59:21 } +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 608/ 3125], loss: 0.591, per_step_time: 1413ms, lr: 1.7743882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65890 samples/s/p 0:59:18 } +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 610/ 3125], loss: 0.108, per_step_time: 1414ms, lr: 1.771748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65760 samples/s/p 0:59:16 } +2024-07-30 05:10:32,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 612/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 1.7691108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65243 samples/s/p 0:59:16 } +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 614/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 1.7664751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.66051 samples/s/p 0:59:08 } +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 616/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 1.7638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65683 samples/s/p 0:59:08 } +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 618/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.7612073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.65768 samples/s/p 0:59:04 } +2024-07-30 05:10:43,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 620/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 1.758576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:43,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66271 samples/s/p 0:58:58 } +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 622/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.7559465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:46,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66100 samples/s/p 0:58:57 } +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 624/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 1.7533185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66043 samples/s/p 0:58:54 } +2024-07-30 05:10:51,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 626/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 1.750692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:51,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66011 samples/s/p 0:58:52 } +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 628/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.7480671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.66044 samples/s/p 0:58:49 } +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 630/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.7454427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65907 samples/s/p 0:58:47 } +2024-07-30 05:11:00,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 632/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 1.7428207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:00,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65235 samples/s/p 0:58:48 } +2024-07-30 05:11:03,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 634/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 1.7401995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:03,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65113 samples/s/p 0:58:46 } +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 636/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 1.7375809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66151 samples/s/p 0:58:37 } +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 638/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.7349636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.65901 samples/s/p 0:58:35 } +2024-07-30 05:11:11,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 640/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 1.7323479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:11,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66028 samples/s/p 0:58:32 } +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 642/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.7297339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66100 samples/s/p 0:58:28 } +2024-07-30 05:11:17,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 644/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 1.7271215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:17,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.65978 samples/s/p 0:58:26 } +2024-07-30 05:11:20,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 646/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.7245095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66139 samples/s/p 0:58:23 } +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 648/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 1.7219004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66021 samples/s/p 0:58:20 } +2024-07-30 05:11:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 650/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7192924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:25,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65844 samples/s/p 0:58:19 } +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 652/ 3125], loss: 0.326, per_step_time: 1414ms, lr: 1.7166861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65570 samples/s/p 0:58:18 } +2024-07-30 05:11:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 654/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.7140806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66013 samples/s/p 0:58:12 } +2024-07-30 05:11:34,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 656/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7114774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:34,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66073 samples/s/p 0:58:09 } +2024-07-30 05:11:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 658/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7088759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65997 samples/s/p 0:58:06 } +2024-07-30 05:11:40,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 660/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 1.706275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:40,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66132 samples/s/p 0:58:03 } +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 662/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7036765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:42,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65937 samples/s/p 0:58:01 } +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 664/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7010799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66090 samples/s/p 0:57:57 } +2024-07-30 05:11:48,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 666/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6984844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:48,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65790 samples/s/p 0:57:56 } +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 668/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.695891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65916 samples/s/p 0:57:53 } +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 670/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 1.6932988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65661 samples/s/p 0:57:52 } +2024-07-30 05:11:57,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 672/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 1.690708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:57,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65095 samples/s/p 0:57:52 } +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 674/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 1.6881182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65959 samples/s/p 0:57:44 } +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 676/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.6855311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65796 samples/s/p 0:57:42 } +2024-07-30 05:12:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 678/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6829442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:05,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66080 samples/s/p 0:57:38 } +2024-07-30 05:12:08,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 680/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 1.6803601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:08,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66215 samples/s/p 0:57:34 } +2024-07-30 05:12:11,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 682/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 1.6777774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:11,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65720 samples/s/p 0:57:34 } +2024-07-30 05:12:14,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 684/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 1.6751966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:14,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66131 samples/s/p 0:57:29 } +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 686/ 3125], loss: 0.592, per_step_time: 1413ms, lr: 1.6726168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66069 samples/s/p 0:57:26 } +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 688/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 1.670038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.66037 samples/s/p 0:57:24 } +2024-07-30 05:12:22,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 690/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.6674619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:22,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65652 samples/s/p 0:57:23 } +2024-07-30 05:12:25,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 692/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.6648873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65926 samples/s/p 0:57:19 } +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 694/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 1.6623145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66075 samples/s/p 0:57:15 } +2024-07-30 05:12:31,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 696/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 1.6597429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66203 samples/s/p 0:57:11 } +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 698/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.657173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66059 samples/s/p 0:57:10 } +2024-07-30 05:12:36,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 700/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6546037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:36,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66029 samples/s/p 0:57:07 } +2024-07-30 05:12:39,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 702/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.6520369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65814 samples/s/p 0:57:05 } +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 704/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.6494708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65850 samples/s/p 0:57:02 } +2024-07-30 05:12:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 706/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 1.6469075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65820 samples/s/p 0:57:00 } +2024-07-30 05:12:48,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 708/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.6443457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:48,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65754 samples/s/p 0:56:57 } +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 1.6417855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65850 samples/s/p 0:56:54 } +2024-07-30 05:12:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 712/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 1.6392266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65815 samples/s/p 0:56:51 } +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 714/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.6366696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65943 samples/s/p 0:56:48 } +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 716/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 1.6341144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65725 samples/s/p 0:56:46 } +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 718/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 1.6315594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66105 samples/s/p 0:56:41 } +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 720/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.6290071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65931 samples/s/p 0:56:39 } +2024-07-30 05:13:07,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 722/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 1.6264567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65992 samples/s/p 0:56:36 } +2024-07-30 05:13:10,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 724/ 3125], loss: 0.184, per_step_time: 1414ms, lr: 1.6239064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65714 samples/s/p 0:56:35 } +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 726/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 1.6213589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65693 samples/s/p 0:56:32 } +2024-07-30 05:13:16,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 728/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 1.6188135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65739 samples/s/p 0:56:29 } +2024-07-30 05:13:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 730/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 1.6162691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:19,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66151 samples/s/p 0:56:24 } +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 732/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 1.6137257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65985 samples/s/p 0:56:22 } +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 734/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6111848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65930 samples/s/p 0:56:19 } +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 736/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.6086453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65919 samples/s/p 0:56:17 } +2024-07-30 05:13:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 738/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.6061076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:30,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65569 samples/s/p 0:56:16 } +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 740/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 1.6035715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65858 samples/s/p 0:56:11 } +2024-07-30 05:13:36,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 742/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.6010371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66044 samples/s/p 0:56:07 } +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 744/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 1.5985032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:39,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65999 samples/s/p 0:56:05 } +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 746/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 1.5959721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66197 samples/s/p 0:56:01 } +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 748/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.5934413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66004 samples/s/p 0:55:59 } +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 750/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.5909135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65955 samples/s/p 0:55:57 } +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:14:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 752/ 3125], loss: 0.167, per_step_time: 2695ms, lr: 1.5883871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:24,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 2.96806 samples/s/p 1:46:36 } +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 754/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 1.5858626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65736 samples/s/p 0:55:52 } +2024-07-30 05:14:29,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 756/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.5833392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.66037 samples/s/p 0:55:48 } +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 758/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.5808176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65560 samples/s/p 0:55:48 } +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 760/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 1.5782979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65124 samples/s/p 0:55:47 } +2024-07-30 05:14:38,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 762/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 1.5757787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:38,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65441 samples/s/p 0:55:43 } +2024-07-30 05:14:41,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 764/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.5732625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:41,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66108 samples/s/p 0:55:36 } +2024-07-30 05:14:44,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 766/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.5707475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66151 samples/s/p 0:55:33 } +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 768/ 3125], loss: 0.225, per_step_time: 1416ms, lr: 1.5682333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.64670 samples/s/p 0:55:39 } +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 770/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.5657216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66071 samples/s/p 0:55:28 } +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 772/ 3125], loss: 0.538, per_step_time: 1414ms, lr: 1.5632113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.65722 samples/s/p 0:55:27 } +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 774/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.5607031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.65933 samples/s/p 0:55:23 } +2024-07-30 05:14:58,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 776/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.5581957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66214 samples/s/p 0:55:18 } +2024-07-30 05:15:01,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 778/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5556905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65899 samples/s/p 0:55:17 } +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 780/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.5531871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65880 samples/s/p 0:55:15 } +2024-07-30 05:15:07,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 782/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.5506852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:07,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66008 samples/s/p 0:55:11 } +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 784/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.548185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65987 samples/s/p 0:55:08 } +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 786/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 1.5456867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65906 samples/s/p 0:55:06 } +2024-07-30 05:15:16,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 788/ 3125], loss: 0.313, per_step_time: 1414ms, lr: 1.543189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:16,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65770 samples/s/p 0:55:04 } +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 790/ 3125], loss: 0.309, per_step_time: 1415ms, lr: 1.5406936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65338 samples/s/p 0:55:04 } +2024-07-30 05:15:22,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 792/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5381992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65965 samples/s/p 0:54:57 } +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 794/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.5357074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65839 samples/s/p 0:54:55 } +2024-07-30 05:15:27,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 796/ 3125], loss: 0.059, per_step_time: 1414ms, lr: 1.5332171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65578 samples/s/p 0:54:54 } +2024-07-30 05:15:30,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 798/ 3125], loss: 0.459, per_step_time: 1415ms, lr: 1.5307284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:30,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65319 samples/s/p 0:54:53 } +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 800/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 1.5282416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65777 samples/s/p 0:54:47 } +2024-07-30 05:15:36,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 802/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 1.525756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65845 samples/s/p 0:54:44 } +2024-07-30 05:15:39,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 804/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.5232717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:39,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.66004 samples/s/p 0:54:40 } +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 806/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.5207895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65961 samples/s/p 0:54:37 } +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 808/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 1.5183094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65477 samples/s/p 0:54:37 } +2024-07-30 05:15:47,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 810/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 1.5158307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:47,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65895 samples/s/p 0:54:32 } +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 812/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.5133529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66089 samples/s/p 0:54:28 } +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 814/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 1.5108776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65819 samples/s/p 0:54:27 } +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 816/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 1.508404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66033 samples/s/p 0:54:23 } +2024-07-30 05:15:59,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 818/ 3125], loss: 0.181, per_step_time: 1418ms, lr: 1.5059313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:59,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.63803 samples/s/p 0:54:33 } +2024-07-30 05:16:01,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 820/ 3125], loss: 0.269, per_step_time: 1412ms, lr: 1.5034607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:01,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66211 samples/s/p 0:54:16 } +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 822/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 1.5009921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65621 samples/s/p 0:54:17 } +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 824/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 1.4985251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.66116 samples/s/p 0:54:11 } +2024-07-30 05:16:10,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 826/ 3125], loss: 0.120, per_step_time: 1415ms, lr: 1.4960599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:10,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65270 samples/s/p 0:54:13 } +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 828/ 3125], loss: 0.141, per_step_time: 1415ms, lr: 1.4935964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65035 samples/s/p 0:54:12 } +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 830/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 1.4911344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65448 samples/s/p 0:54:06 } +2024-07-30 05:16:18,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 832/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 1.4886731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65399 samples/s/p 0:54:04 } +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 834/ 3125], loss: 0.438, per_step_time: 1412ms, lr: 1.4862144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66298 samples/s/p 0:53:56 } +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 836/ 3125], loss: 0.238, per_step_time: 1412ms, lr: 1.4837568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66251 samples/s/p 0:53:53 } +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 838/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.4813014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:27,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66019 samples/s/p 0:53:52 } +2024-07-30 05:16:30,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 840/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.4788482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66040 samples/s/p 0:53:49 } +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 842/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 1.4763963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65866 samples/s/p 0:53:47 } +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 844/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.473946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65864 samples/s/p 0:53:44 } +2024-07-30 05:16:38,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 846/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.4714974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:38,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65991 samples/s/p 0:53:41 } +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 848/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 1.4690497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66103 samples/s/p 0:53:37 } +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 850/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 1.4666044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65931 samples/s/p 0:53:35 } +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 852/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4641612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66089 samples/s/p 0:53:32 } +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 854/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.4617192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:50,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65868 samples/s/p 0:53:30 } +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.4592785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66125 samples/s/p 0:53:26 } +2024-07-30 05:16:55,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 858/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 1.45684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:55,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65582 samples/s/p 0:53:26 } +2024-07-30 05:16:58,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 860/ 3125], loss: 0.421, per_step_time: 1415ms, lr: 1.4544033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:58,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65288 samples/s/p 0:53:25 } +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 862/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 1.4519674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65792 samples/s/p 0:53:19 } +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 864/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.4495342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65981 samples/s/p 0:53:15 } +2024-07-30 05:17:07,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 866/ 3125], loss: 0.387, per_step_time: 1415ms, lr: 1.4471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:07,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65208 samples/s/p 0:53:17 } +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 868/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 1.4446726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65828 samples/s/p 0:53:11 } +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 870/ 3125], loss: 0.101, per_step_time: 1416ms, lr: 1.4422443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.64763 samples/s/p 0:53:14 } +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 872/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 1.4398178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66006 samples/s/p 0:53:04 } +2024-07-30 05:17:18,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 874/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4373928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:18,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66035 samples/s/p 0:53:01 } +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 876/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 1.434969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.66083 samples/s/p 0:52:58 } +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 878/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.4325475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.65924 samples/s/p 0:52:56 } +2024-07-30 05:17:26,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 880/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.430127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:26,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66151 samples/s/p 0:52:52 } +2024-07-30 05:17:29,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 882/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4277089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65913 samples/s/p 0:52:50 } +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 884/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 1.4252928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65914 samples/s/p 0:52:47 } +2024-07-30 05:17:35,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 886/ 3125], loss: 0.484, per_step_time: 1413ms, lr: 1.4228782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:35,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65933 samples/s/p 0:52:45 } +2024-07-30 05:17:38,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 888/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.4204651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65755 samples/s/p 0:52:43 } +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 890/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4180529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66024 samples/s/p 0:52:38 } +2024-07-30 05:17:43,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 892/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 1.4156436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:43,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65571 samples/s/p 0:52:38 } +2024-07-30 05:17:46,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 894/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.413236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:46,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65618 samples/s/p 0:52:35 } +2024-07-30 05:17:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 896/ 3125], loss: 0.374, per_step_time: 1412ms, lr: 1.41083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:49,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66206 samples/s/p 0:52:29 } +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 898/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 1.4084255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65937 samples/s/p 0:52:28 } +2024-07-30 05:17:55,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 900/ 3125], loss: 0.492, per_step_time: 1413ms, lr: 1.406022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:55,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65904 samples/s/p 0:52:25 } +2024-07-30 05:17:58,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 902/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 1.4036211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65557 samples/s/p 0:52:24 } +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 904/ 3125], loss: 0.187, per_step_time: 1418ms, lr: 1.401222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.63919 samples/s/p 0:52:30 } +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 906/ 3125], loss: 0.287, per_step_time: 1415ms, lr: 1.3988235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65367 samples/s/p 0:52:19 } +2024-07-30 05:18:06,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 908/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.396428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:06,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65668 samples/s/p 0:52:15 } +2024-07-30 05:18:09,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 910/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 1.3940337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:09,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65666 samples/s/p 0:52:12 } +2024-07-30 05:18:12,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 912/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 1.3916415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:12,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65746 samples/s/p 0:52:09 } +2024-07-30 05:18:15,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 914/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.389251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:15,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65941 samples/s/p 0:52:05 } +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 916/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.3868621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65997 samples/s/p 0:52:02 } +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 918/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.3844749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65970 samples/s/p 0:51:59 } +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 920/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 1.3820886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66063 samples/s/p 0:51:56 } +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 922/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 1.379705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65948 samples/s/p 0:51:54 } +2024-07-30 05:18:29,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 924/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.3773221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:29,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66019 samples/s/p 0:51:50 } +2024-07-30 05:18:32,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 926/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.374942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:32,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66169 samples/s/p 0:51:47 } +2024-07-30 05:18:34,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 928/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.3725635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65957 samples/s/p 0:51:45 } +2024-07-30 05:18:37,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 930/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.3701865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65922 samples/s/p 0:51:42 } +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 932/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 1.3678115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65811 samples/s/p 0:51:40 } +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 934/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 1.3654375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65916 samples/s/p 0:51:37 } +2024-07-30 05:18:46,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 936/ 3125], loss: 0.172, per_step_time: 1414ms, lr: 1.3630661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:46,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65724 samples/s/p 0:51:35 } +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 938/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.3606963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65488 samples/s/p 0:51:33 } +2024-07-30 05:18:51,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 940/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.3583282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:51,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65885 samples/s/p 0:51:28 } +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 942/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.3559616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:54,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65916 samples/s/p 0:51:25 } +2024-07-30 05:18:57,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 944/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.3535961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:57,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65965 samples/s/p 0:51:22 } +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 946/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 1.3512334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66072 samples/s/p 0:51:19 } +2024-07-30 05:19:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 948/ 3125], loss: 0.154, per_step_time: 1412ms, lr: 1.3488716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:03,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66183 samples/s/p 0:51:16 } +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 950/ 3125], loss: 0.323, per_step_time: 1417ms, lr: 1.3465121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.64222 samples/s/p 0:51:23 } +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 952/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.3441542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65925 samples/s/p 0:51:11 } +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 954/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 1.3417986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66071 samples/s/p 0:51:08 } +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 956/ 3125], loss: 0.491, per_step_time: 1413ms, lr: 1.3394442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65928 samples/s/p 0:51:06 } +2024-07-30 05:19:17,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 958/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 1.3370919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:17,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65864 samples/s/p 0:51:03 } +2024-07-30 05:19:20,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 960/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 1.3347413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65714 samples/s/p 0:51:01 } +2024-07-30 05:19:23,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 962/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 1.3323923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:23,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65882 samples/s/p 0:50:57 } +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 964/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 1.3300445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65640 samples/s/p 0:50:56 } +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 966/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.3276988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65949 samples/s/p 0:50:51 } +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 968/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.3253546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65628 samples/s/p 0:50:50 } +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 970/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.3230127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.66120 samples/s/p 0:50:45 } +2024-07-30 05:19:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 972/ 3125], loss: 0.278, per_step_time: 1414ms, lr: 1.3206726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:37,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65738 samples/s/p 0:50:44 } +2024-07-30 05:19:40,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 974/ 3125], loss: 0.165, per_step_time: 1414ms, lr: 1.3183341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:40,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65734 samples/s/p 0:50:41 } +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 976/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 1.3159975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65399 samples/s/p 0:50:40 } +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 978/ 3125], loss: 0.212, per_step_time: 1415ms, lr: 1.3136619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:45,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65176 samples/s/p 0:50:39 } +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 980/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 1.3113287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.64623 samples/s/p 0:50:39 } +2024-07-30 05:19:51,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 982/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 1.3089972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:51,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65490 samples/s/p 0:50:31 } +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 984/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 1.3066679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:54,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66111 samples/s/p 0:50:25 } +2024-07-30 05:19:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 986/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.30434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65806 samples/s/p 0:50:24 } +2024-07-30 05:19:59,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 988/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.302014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:59,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65985 samples/s/p 0:50:20 } +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 990/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 1.2996887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66161 samples/s/p 0:50:16 } +2024-07-30 05:20:05,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 992/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.2973654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:05,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65823 samples/s/p 0:50:15 } +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 994/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 1.2950447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65908 samples/s/p 0:50:12 } +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 996/ 3125], loss: 0.069, per_step_time: 1413ms, lr: 1.2927258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66035 samples/s/p 0:50:09 } +2024-07-30 05:20:14,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 998/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 1.2904086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65972 samples/s/p 0:50:06 } +2024-07-30 05:20:16,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1000/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.288093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:16,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66117 samples/s/p 0:50:02 } +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1002/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.2857795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66002 samples/s/p 0:50:00 } +2024-07-30 05:20:22,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1004/ 3125], loss: 0.308, per_step_time: 1412ms, lr: 1.2834673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:22,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66230 samples/s/p 0:49:56 } +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1006/ 3125], loss: 0.276, per_step_time: 1416ms, lr: 1.2811565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:25,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.64949 samples/s/p 0:50:00 } +2024-07-30 05:20:28,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1008/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.2788483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65954 samples/s/p 0:49:52 } +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1010/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.2765416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66033 samples/s/p 0:49:49 } +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1012/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.2742358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65950 samples/s/p 0:49:46 } +2024-07-30 05:20:36,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1014/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.271933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65578 samples/s/p 0:49:45 } +2024-07-30 05:20:39,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1016/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 1.2696316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65769 samples/s/p 0:49:42 } +2024-07-30 05:20:42,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1018/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 1.2673321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:42,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65735 samples/s/p 0:49:39 } +2024-07-30 05:20:45,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1020/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 1.2650338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:45,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65823 samples/s/p 0:49:36 } +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1022/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 1.2627381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65779 samples/s/p 0:49:33 } +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1024/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 1.2604439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65550 samples/s/p 0:49:31 } +2024-07-30 05:20:53,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1026/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.2581515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:53,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.66064 samples/s/p 0:49:26 } +2024-07-30 05:20:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1028/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.2558612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65107 samples/s/p 0:49:28 } +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1030/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2535721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66056 samples/s/p 0:49:20 } +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1032/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 1.2512851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65504 samples/s/p 0:49:20 } +2024-07-30 05:21:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1034/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.2489995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:05,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65977 samples/s/p 0:49:15 } +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1036/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.2467151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66061 samples/s/p 0:49:12 } +2024-07-30 05:21:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1038/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.2444335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:10,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65995 samples/s/p 0:49:09 } +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1040/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 1.2421536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66164 samples/s/p 0:49:06 } +2024-07-30 05:21:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1042/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 1.2398758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:16,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65859 samples/s/p 0:49:04 } +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1044/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.2375996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65876 samples/s/p 0:49:01 } +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1046/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.2353253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:22,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66025 samples/s/p 0:48:58 } +2024-07-30 05:21:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1048/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2330526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66030 samples/s/p 0:48:55 } +2024-07-30 05:21:27,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1050/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.2307808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:27,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66135 samples/s/p 0:48:52 } +2024-07-30 05:21:30,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1052/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 1.2285119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65933 samples/s/p 0:48:50 } +2024-07-30 05:21:33,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1054/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.2262445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:33,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65958 samples/s/p 0:48:47 } +2024-07-30 05:21:36,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1056/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.2239792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65890 samples/s/p 0:48:44 } +2024-07-30 05:21:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1058/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 1.2217149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65891 samples/s/p 0:48:42 } +2024-07-30 05:21:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1060/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.2194532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65949 samples/s/p 0:48:38 } +2024-07-30 05:21:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1062/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.2171932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65950 samples/s/p 0:48:36 } +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1064/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.214934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.66025 samples/s/p 0:48:32 } +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1066/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.2126776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.65897 samples/s/p 0:48:30 } +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1068/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.2104231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:53,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65842 samples/s/p 0:48:28 } +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1070/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.2081704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66064 samples/s/p 0:48:24 } +2024-07-30 05:21:59,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1072/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 1.2059196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:59,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65676 samples/s/p 0:48:23 } +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1074/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.2036704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65404 samples/s/p 0:48:21 } +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1076/ 3125], loss: 0.046, per_step_time: 1412ms, lr: 1.2014228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66180 samples/s/p 0:48:15 } +2024-07-30 05:22:07,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1078/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 1.1991766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:07,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65758 samples/s/p 0:48:14 } +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1080/ 3125], loss: 0.406, per_step_time: 1414ms, lr: 1.1969328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65511 samples/s/p 0:48:12 } +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1082/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 1.1946902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65695 samples/s/p 0:48:09 } +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1084/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.1924502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.66107 samples/s/p 0:48:04 } +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1086/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 1.1902121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66096 samples/s/p 0:48:01 } +2024-07-30 05:22:21,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1088/ 3125], loss: 0.171, per_step_time: 1415ms, lr: 1.1879754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:21,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65276 samples/s/p 0:48:02 } +2024-07-30 05:22:24,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1090/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 1.1857411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65728 samples/s/p 0:47:57 } +2024-07-30 05:22:27,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1092/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 1.1835074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:27,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65548 samples/s/p 0:47:55 } +2024-07-30 05:22:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1094/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1812764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:30,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66137 samples/s/p 0:47:49 } +2024-07-30 05:22:33,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 1.1790472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66056 samples/s/p 0:47:47 } +2024-07-30 05:22:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1098/ 3125], loss: 0.470, per_step_time: 1414ms, lr: 1.1768198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:35,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65734 samples/s/p 0:47:46 } +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1100/ 3125], loss: 0.447, per_step_time: 1414ms, lr: 1.1745944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65429 samples/s/p 0:47:45 } +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1102/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 1.1723699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66072 samples/s/p 0:47:39 } +2024-07-30 05:22:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1104/ 3125], loss: 0.231, per_step_time: 1412ms, lr: 1.1701483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:44,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66216 samples/s/p 0:47:35 } +2024-07-30 05:22:47,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1106/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 1.167928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:47,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65920 samples/s/p 0:47:34 } +2024-07-30 05:22:50,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1108/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.1657089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65895 samples/s/p 0:47:31 } +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1110/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 1.1634928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65783 samples/s/p 0:47:29 } +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1112/ 3125], loss: 0.417, per_step_time: 1415ms, lr: 1.1612782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65204 samples/s/p 0:47:29 } +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1114/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 1.1590654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65325 samples/s/p 0:47:25 } +2024-07-30 05:23:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1116/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.1568549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:01,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65960 samples/s/p 0:47:19 } +2024-07-30 05:23:04,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1118/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.1546457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:04,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65882 samples/s/p 0:47:17 } +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1120/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1524385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65801 samples/s/p 0:47:14 } +2024-07-30 05:23:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1122/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 1.1502325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.66018 samples/s/p 0:47:11 } +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1124/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1480287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66026 samples/s/p 0:47:08 } +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1126/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.1458262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66098 samples/s/p 0:47:04 } +2024-07-30 05:23:18,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1128/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.1436265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:18,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66050 samples/s/p 0:47:02 } +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1130/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 1.1414284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:21,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66133 samples/s/p 0:46:59 } +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1132/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 1.1392325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66108 samples/s/p 0:46:56 } +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1134/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.1370381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65902 samples/s/p 0:46:54 } +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1136/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.1348446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66203 samples/s/p 0:46:50 } +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1138/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 1.1326542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65738 samples/s/p 0:46:49 } +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1140/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.1304655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66088 samples/s/p 0:46:45 } +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1142/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 1.1282783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66144 samples/s/p 0:46:42 } +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1144/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.1260936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65826 samples/s/p 0:46:40 } +2024-07-30 05:23:43,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1239093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:43,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65898 samples/s/p 0:46:37 } +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1148/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.1217281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65584 samples/s/p 0:46:36 } +2024-07-30 05:23:49,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1150/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 1.1195477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65839 samples/s/p 0:46:32 } +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1152/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.1173704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66060 samples/s/p 0:46:28 } +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1154/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 1.1151942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66080 samples/s/p 0:46:25 } +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1156/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 1.1130204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66100 samples/s/p 0:46:22 } +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1158/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 1.1108484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.65743 samples/s/p 0:46:21 } +2024-07-30 05:24:03,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1160/ 3125], loss: 0.223, per_step_time: 1416ms, lr: 1.1086782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:03,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.64609 samples/s/p 0:46:24 } +2024-07-30 05:24:06,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1162/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 1.1065096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:06,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65576 samples/s/p 0:46:16 } +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1164/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.1043423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65904 samples/s/p 0:46:12 } +2024-07-30 05:24:12,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1166/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.1021775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:12,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66052 samples/s/p 0:46:08 } +2024-07-30 05:24:15,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1168/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.1000147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65920 samples/s/p 0:46:06 } +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1170/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.0978531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66038 samples/s/p 0:46:03 } +2024-07-30 05:24:20,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1172/ 3125], loss: 0.636, per_step_time: 1413ms, lr: 1.0956943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65803 samples/s/p 0:46:01 } +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1174/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.0935369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65813 samples/s/p 0:45:58 } +2024-07-30 05:24:26,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1176/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 1.0913816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.66006 samples/s/p 0:45:54 } +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1178/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 1.0892278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65940 samples/s/p 0:45:52 } +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1180/ 3125], loss: 0.293, per_step_time: 1417ms, lr: 1.0870757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:32,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.64504 samples/s/p 0:45:56 } +2024-07-30 05:24:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1182/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 1.0849258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.66141 samples/s/p 0:45:45 } +2024-07-30 05:24:37,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1184/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.082778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65906 samples/s/p 0:45:43 } +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1186/ 3125], loss: 0.209, per_step_time: 1415ms, lr: 1.0806319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65198 samples/s/p 0:45:44 } +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1188/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.0784879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65834 samples/s/p 0:45:38 } +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1190/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 1.0763446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66072 samples/s/p 0:45:34 } +2024-07-30 05:24:49,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1192/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 1.0742044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:49,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66070 samples/s/p 0:45:31 } +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1194/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.0720652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66041 samples/s/p 0:45:29 } +2024-07-30 05:24:54,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1196/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.0699284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:54,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66083 samples/s/p 0:45:26 } +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1198/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 1.0677936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65660 samples/s/p 0:45:25 } +2024-07-30 05:25:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1200/ 3125], loss: 0.418, per_step_time: 1414ms, lr: 1.0656607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:00,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65674 samples/s/p 0:45:22 } +2024-07-30 05:25:03,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1202/ 3125], loss: 0.381, per_step_time: 1415ms, lr: 1.0635296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:03,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65154 samples/s/p 0:45:22 } +2024-07-30 05:25:06,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1204/ 3125], loss: 0.090, per_step_time: 1416ms, lr: 1.0614004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64736 samples/s/p 0:45:21 } +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1206/ 3125], loss: 0.344, per_step_time: 1416ms, lr: 1.0592731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64617 samples/s/p 0:45:19 } +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1208/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.0571473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66034 samples/s/p 0:45:09 } +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1210/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 1.055024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66259 samples/s/p 0:45:05 } +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1212/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.0529023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65932 samples/s/p 0:45:04 } +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1214/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.0507816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66070 samples/s/p 0:45:00 } +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1216/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.0486639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65983 samples/s/p 0:44:58 } +2024-07-30 05:25:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1218/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 1.0465478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:25,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.65983 samples/s/p 0:44:55 } +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1220/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 1.0444339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66011 samples/s/p 0:44:52 } +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1222/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.0423207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66046 samples/s/p 0:44:49 } +2024-07-30 05:25:34,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1224/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 1.0402107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66045 samples/s/p 0:44:46 } +2024-07-30 05:25:37,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1226/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 1.0381021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:37,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66122 samples/s/p 0:44:43 } +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1228/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.0359954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66028 samples/s/p 0:44:41 } +2024-07-30 05:25:42,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1230/ 3125], loss: 0.169, per_step_time: 1412ms, lr: 1.0338911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66206 samples/s/p 0:44:37 } +2024-07-30 05:25:45,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1232/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 1.0317883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:45,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65987 samples/s/p 0:44:35 } +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1234/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 1.0296869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65756 samples/s/p 0:44:33 } +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1236/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 1.0275876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:51,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66026 samples/s/p 0:44:29 } +2024-07-30 05:25:54,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1238/ 3125], loss: 0.423, per_step_time: 1416ms, lr: 1.0254902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:54,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.64796 samples/s/p 0:44:32 } +2024-07-30 05:25:57,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1240/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.023395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:57,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66109 samples/s/p 0:44:23 } +2024-07-30 05:25:59,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1242/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.0213017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:59,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66088 samples/s/p 0:44:21 } +2024-07-30 05:26:02,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1244/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 1.0192105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66077 samples/s/p 0:44:18 } +2024-07-30 05:26:05,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1246/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 1.0171208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:05,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65533 samples/s/p 0:44:18 } +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1248/ 3125], loss: 0.165, per_step_time: 1415ms, lr: 1.0150334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65240 samples/s/p 0:44:16 } +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1250/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.0129478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65923 samples/s/p 0:44:10 } +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1252/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.0108635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65730 samples/s/p 0:44:08 } +2024-07-30 05:26:16,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1254/ 3125], loss: 0.194, per_step_time: 1415ms, lr: 1.0087817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65043 samples/s/p 0:44:09 } +2024-07-30 05:26:19,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1256/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 1.0067016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:19,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65728 samples/s/p 0:44:02 } +2024-07-30 05:26:22,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1258/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.0046228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:22,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65774 samples/s/p 0:43:59 } +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1260/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.0025468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.66074 samples/s/p 0:43:55 } +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1262/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.0004726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65946 samples/s/p 0:43:53 } +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1264/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 9.984001e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65404 samples/s/p 0:43:53 } +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1266/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.963288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.65932 samples/s/p 0:43:47 } +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1268/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.942609e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66273 samples/s/p 0:43:43 } +2024-07-30 05:26:39,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1270/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 9.921941e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:39,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66023 samples/s/p 0:43:41 } +2024-07-30 05:26:42,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1272/ 3125], loss: 0.419, per_step_time: 1419ms, lr: 9.901294e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:42,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.63515 samples/s/p 0:43:50 } +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1274/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 9.880667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66007 samples/s/p 0:43:36 } +2024-07-30 05:26:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1276/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 9.86006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66096 samples/s/p 0:43:32 } +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1278/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.839463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66043 samples/s/p 0:43:30 } +2024-07-30 05:26:53,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1280/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.818893e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66022 samples/s/p 0:43:27 } +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1282/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.798335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.65928 samples/s/p 0:43:25 } +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1284/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.777805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65975 samples/s/p 0:43:22 } +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1286/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.757292e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66091 samples/s/p 0:43:18 } +2024-07-30 05:27:05,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1288/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 9.7368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66040 samples/s/p 0:43:16 } +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1290/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.716326e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66066 samples/s/p 0:43:13 } +2024-07-30 05:27:10,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1292/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.695873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65967 samples/s/p 0:43:10 } +2024-07-30 05:27:13,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1294/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.675427e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:13,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66009 samples/s/p 0:43:07 } +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1296/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.655014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66039 samples/s/p 0:43:04 } +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1298/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.634616e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.65885 samples/s/p 0:43:02 } +2024-07-30 05:27:22,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1300/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 9.614238e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:22,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66318 samples/s/p 0:42:58 } +2024-07-30 05:27:25,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1302/ 3125], loss: 0.200, per_step_time: 1415ms, lr: 9.593874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:25,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65264 samples/s/p 0:43:00 } +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1304/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.573533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.66162 samples/s/p 0:42:53 } +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1306/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.553214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65771 samples/s/p 0:42:52 } +2024-07-30 05:27:33,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1308/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.532913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65441 samples/s/p 0:42:50 } +2024-07-30 05:27:36,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1310/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 9.512627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65714 samples/s/p 0:42:46 } +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1312/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.4923644e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:39,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.65984 samples/s/p 0:42:42 } +2024-07-30 05:27:42,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1314/ 3125], loss: 0.175, per_step_time: 1412ms, lr: 9.4721196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:42,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66182 samples/s/p 0:42:38 } +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1316/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 9.4518987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.65989 samples/s/p 0:42:36 } +2024-07-30 05:27:47,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1318/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 9.4316925e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:47,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66109 samples/s/p 0:42:33 } +2024-07-30 05:27:50,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1320/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.4115137e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:50,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66070 samples/s/p 0:42:30 } +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1322/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.391346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65928 samples/s/p 0:42:28 } +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1324/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.371191e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66095 samples/s/p 0:42:25 } +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1326/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.3510596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66016 samples/s/p 0:42:22 } +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1328/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 9.330952e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65922 samples/s/p 0:42:20 } +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1330/ 3125], loss: 0.522, per_step_time: 1414ms, lr: 9.310865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65534 samples/s/p 0:42:19 } +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1332/ 3125], loss: 0.282, per_step_time: 1415ms, lr: 9.2907993e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65310 samples/s/p 0:42:17 } +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1334/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.270751e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65938 samples/s/p 0:42:11 } +2024-07-30 05:28:13,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1336/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.2507213e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65605 samples/s/p 0:42:10 } +2024-07-30 05:28:16,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1338/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 9.230703e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:16,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65728 samples/s/p 0:42:07 } +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1340/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.2107143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65814 samples/s/p 0:42:03 } +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1342/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 9.190744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65829 samples/s/p 0:42:00 } +2024-07-30 05:28:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1344/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.1707915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66000 samples/s/p 0:41:57 } +2024-07-30 05:28:27,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1346/ 3125], loss: 0.495, per_step_time: 1413ms, lr: 9.1508593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:27,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66066 samples/s/p 0:41:54 } +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1348/ 3125], loss: 0.077, per_step_time: 1413ms, lr: 9.1309425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66084 samples/s/p 0:41:51 } +2024-07-30 05:28:33,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1350/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 9.1110496e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66144 samples/s/p 0:41:48 } +2024-07-30 05:28:35,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1352/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.0911686e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65903 samples/s/p 0:41:46 } +2024-07-30 05:28:38,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1354/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.071317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:38,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65963 samples/s/p 0:41:43 } +2024-07-30 05:28:41,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1356/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.0514806e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:41,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65896 samples/s/p 0:41:40 } +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1358/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.0316684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65993 samples/s/p 0:41:37 } +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1360/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.011873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66106 samples/s/p 0:41:34 } +2024-07-30 05:28:50,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1362/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.992097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:50,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65842 samples/s/p 0:41:32 } +2024-07-30 05:28:52,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1364/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 8.972341e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:52,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66056 samples/s/p 0:41:28 } +2024-07-30 05:28:55,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1366/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.9526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65676 samples/s/p 0:41:27 } +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1368/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 8.9328825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65654 samples/s/p 0:41:24 } +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1370/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.913186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66078 samples/s/p 0:41:20 } +2024-07-30 05:29:04,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1372/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 8.8935013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65972 samples/s/p 0:41:17 } +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1374/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 8.873841e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66055 samples/s/p 0:41:14 } +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1376/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 8.854207e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66358 samples/s/p 0:41:10 } +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1378/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.834588e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66088 samples/s/p 0:41:08 } +2024-07-30 05:29:15,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1380/ 3125], loss: 0.412, per_step_time: 1412ms, lr: 8.8149875e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66232 samples/s/p 0:41:05 } +2024-07-30 05:29:18,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1382/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 8.795401e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:18,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.65929 samples/s/p 0:41:03 } +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1384/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.7758417e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66134 samples/s/p 0:41:00 } +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1386/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 8.7563006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65641 samples/s/p 0:40:59 } +2024-07-30 05:29:26,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1388/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 8.736783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:26,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66264 samples/s/p 0:40:53 } +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1390/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 8.7172805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65999 samples/s/p 0:40:52 } +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1392/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 8.697793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66006 samples/s/p 0:40:49 } +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1394/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.678335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66124 samples/s/p 0:40:46 } +2024-07-30 05:29:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1396/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.658886e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65670 samples/s/p 0:40:45 } +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1398/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 8.6394635e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65383 samples/s/p 0:40:43 } +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1400/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 8.620065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65915 samples/s/p 0:40:38 } +2024-07-30 05:29:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1402/ 3125], loss: 0.256, per_step_time: 1415ms, lr: 8.6006816e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:46,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65276 samples/s/p 0:40:38 } +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1404/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.581319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.66120 samples/s/p 0:40:31 } +2024-07-30 05:29:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1406/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.5619746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:52,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66009 samples/s/p 0:40:29 } +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1408/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.5426535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66041 samples/s/p 0:40:26 } +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1410/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.523345e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65840 samples/s/p 0:40:24 } +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1412/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 8.5040597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65996 samples/s/p 0:40:21 } +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1414/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 8.4847983e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65546 samples/s/p 0:40:20 } +2024-07-30 05:30:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1416/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 8.4655494e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65851 samples/s/p 0:40:16 } +2024-07-30 05:30:09,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1418/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.446324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:09,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65893 samples/s/p 0:40:13 } +2024-07-30 05:30:12,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1420/ 3125], loss: 0.274, per_step_time: 1425ms, lr: 8.427119e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:12,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.61176 samples/s/p 0:40:30 } +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1422/ 3125], loss: 0.061, per_step_time: 1413ms, lr: 8.407938e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66068 samples/s/p 0:40:06 } +2024-07-30 05:30:17,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1424/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.3887664e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:17,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66013 samples/s/p 0:40:04 } +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1426/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 8.3696216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65398 samples/s/p 0:40:03 } +2024-07-30 05:30:23,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1428/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 8.3505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:23,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66056 samples/s/p 0:39:58 } +2024-07-30 05:30:26,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1430/ 3125], loss: 0.045, per_step_time: 1414ms, lr: 8.331391e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:26,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65680 samples/s/p 0:39:57 } +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1432/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 8.3123115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66017 samples/s/p 0:39:52 } +2024-07-30 05:30:32,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1434/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 8.293244e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:32,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.66032 samples/s/p 0:39:49 } +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1436/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.2741946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.65809 samples/s/p 0:39:48 } +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1438/ 3125], loss: 0.568, per_step_time: 1413ms, lr: 8.2551685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.65925 samples/s/p 0:39:44 } +2024-07-30 05:30:40,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1440/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.236155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:40,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66145 samples/s/p 0:39:41 } +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1442/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 8.217174e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66083 samples/s/p 0:39:38 } +2024-07-30 05:30:46,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1444/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.1982074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:46,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66012 samples/s/p 0:39:35 } +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1446/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.179262e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66083 samples/s/p 0:39:32 } +2024-07-30 05:30:51,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1448/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.160338e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.65935 samples/s/p 0:39:30 } +2024-07-30 05:30:54,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1450/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.141431e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:54,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66140 samples/s/p 0:39:26 } +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1452/ 3125], loss: 0.133, per_step_time: 1416ms, lr: 8.1225454e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.64579 samples/s/p 0:39:30 } +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1454/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.1036774e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65943 samples/s/p 0:39:22 } +2024-07-30 05:31:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1456/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 8.0848275e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66238 samples/s/p 0:39:18 } +2024-07-30 05:31:06,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1458/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.0660044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66095 samples/s/p 0:39:15 } +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1460/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.047193e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66092 samples/s/p 0:39:12 } +2024-07-30 05:31:11,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1462/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.028409e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:11,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65647 samples/s/p 0:39:11 } +2024-07-30 05:31:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1464/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.0096453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:14,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66154 samples/s/p 0:39:07 } +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1466/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.9908966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65772 samples/s/p 0:39:05 } +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1468/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 7.9721656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66105 samples/s/p 0:39:01 } +2024-07-30 05:31:23,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1470/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 7.9534647e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:23,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65886 samples/s/p 0:38:59 } +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1472/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.9347785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.66061 samples/s/p 0:38:56 } +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1474/ 3125], loss: 0.316, per_step_time: 1415ms, lr: 7.916108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65275 samples/s/p 0:38:56 } +2024-07-30 05:31:31,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1476/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 7.8974665e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65916 samples/s/p 0:38:51 } +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1478/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 7.87884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65705 samples/s/p 0:38:49 } +2024-07-30 05:31:37,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1480/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.860231e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:37,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65776 samples/s/p 0:38:46 } +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1482/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.841646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65853 samples/s/p 0:38:42 } +2024-07-30 05:31:42,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1484/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 7.8230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:42,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65645 samples/s/p 0:38:40 } +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1486/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.804531e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65824 samples/s/p 0:38:37 } +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1488/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 7.7860085e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65324 samples/s/p 0:38:36 } +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1490/ 3125], loss: 0.481, per_step_time: 1412ms, lr: 7.767504e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66297 samples/s/p 0:38:29 } +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1492/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.7490176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.65998 samples/s/p 0:38:28 } +2024-07-30 05:31:57,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1494/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 7.7305555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:57,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.65755 samples/s/p 0:38:26 } +2024-07-30 05:31:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1496/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 7.7121075e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66100 samples/s/p 0:38:22 } +2024-07-30 05:32:02,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1498/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 7.693684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66163 samples/s/p 0:38:18 } +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1500/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 7.675281e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65000 samples/s/p 0:38:20 } +2024-07-30 05:32:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1502/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.656899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65988 samples/s/p 0:38:14 } +2024-07-30 05:32:11,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1504/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 7.6385317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:11,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66133 samples/s/p 0:38:10 } +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1506/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 7.6201883e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65638 samples/s/p 0:38:09 } +2024-07-30 05:32:16,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1508/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.601866e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:16,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66077 samples/s/p 0:38:05 } +2024-07-30 05:32:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1510/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.583564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:19,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65845 samples/s/p 0:38:03 } +2024-07-30 05:32:22,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1512/ 3125], loss: 0.093, per_step_time: 1413ms, lr: 7.5652775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:22,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65921 samples/s/p 0:38:00 } +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1514/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.547015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66003 samples/s/p 0:37:57 } +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1516/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 7.5287755e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65931 samples/s/p 0:37:54 } +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1518/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.5105544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65991 samples/s/p 0:37:51 } +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1520/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.492354e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66236 samples/s/p 0:37:47 } +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1522/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 7.474175e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65927 samples/s/p 0:37:46 } +2024-07-30 05:32:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1524/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 7.4560074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65826 samples/s/p 0:37:43 } +2024-07-30 05:32:42,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1526/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 7.43787e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:42,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66150 samples/s/p 0:37:39 } +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1528/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 7.419744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65627 samples/s/p 0:37:38 } +2024-07-30 05:32:48,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1530/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.401645e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:48,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65988 samples/s/p 0:37:34 } +2024-07-30 05:32:50,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1532/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 7.383564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65905 samples/s/p 0:37:31 } +2024-07-30 05:32:53,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1534/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.3655065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.66124 samples/s/p 0:37:28 } +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1536/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 7.3474706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66269 samples/s/p 0:37:24 } +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1538/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.3294547e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66089 samples/s/p 0:37:22 } +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1540/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.311451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:02,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65714 samples/s/p 0:37:21 } +2024-07-30 05:33:05,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1542/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 7.2934745e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:05,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66106 samples/s/p 0:37:17 } +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1544/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 7.2755154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66016 samples/s/p 0:37:14 } +2024-07-30 05:33:10,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1546/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.2575807e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65847 samples/s/p 0:37:12 } +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1548/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.23966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.66107 samples/s/p 0:37:08 } +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1550/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 7.221764e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65638 samples/s/p 0:37:07 } +2024-07-30 05:33:19,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1552/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.2038887e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:19,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.66025 samples/s/p 0:37:03 } +2024-07-30 05:33:22,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1554/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 7.186028e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:22,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65724 samples/s/p 0:37:01 } +2024-07-30 05:33:24,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1556/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.168197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:24,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.66295 samples/s/p 0:36:56 } +2024-07-30 05:33:27,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1558/ 3125], loss: 0.151, per_step_time: 1424ms, lr: 7.1503814e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:27,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.61430 samples/s/p 0:37:12 } +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1560/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.1325894e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65594 samples/s/p 0:36:53 } +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1562/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 7.1148185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65645 samples/s/p 0:36:50 } +2024-07-30 05:33:36,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1564/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.097065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:36,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65454 samples/s/p 0:36:48 } +2024-07-30 05:33:39,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1566/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 7.079333e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:39,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65788 samples/s/p 0:36:44 } +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1568/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.061618e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66026 samples/s/p 0:36:40 } +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1570/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.043928e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66037 samples/s/p 0:36:37 } +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1572/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.026252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65974 samples/s/p 0:36:35 } +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1574/ 3125], loss: 0.055, per_step_time: 1413ms, lr: 7.008603e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66147 samples/s/p 0:36:31 } +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1576/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 6.990972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66143 samples/s/p 0:36:28 } +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1578/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.973365e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65895 samples/s/p 0:36:26 } +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1580/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.9557757e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65964 samples/s/p 0:36:23 } +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1582/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.93821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65922 samples/s/p 0:36:21 } +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1584/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 6.920656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66143 samples/s/p 0:36:17 } +2024-07-30 05:34:07,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1586/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9031324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:07,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66045 samples/s/p 0:36:15 } +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1588/ 3125], loss: 0.271, per_step_time: 1416ms, lr: 6.8856235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.64731 samples/s/p 0:36:17 } +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1590/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 6.868142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66157 samples/s/p 0:36:09 } +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1592/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 6.8506716e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.65966 samples/s/p 0:36:06 } +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1594/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 6.833228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65559 samples/s/p 0:36:05 } +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1596/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 6.8158056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66049 samples/s/p 0:36:00 } +2024-07-30 05:34:24,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1598/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.7983956e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:24,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65883 samples/s/p 0:35:58 } +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1600/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.7810146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65979 samples/s/p 0:35:55 } +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1602/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 6.763652e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65734 samples/s/p 0:35:53 } +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1604/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 6.74631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65926 samples/s/p 0:35:50 } +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1606/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.7289915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65839 samples/s/p 0:35:47 } +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1608/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 6.711691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65666 samples/s/p 0:35:45 } +2024-07-30 05:34:41,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1610/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.694412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:41,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.66127 samples/s/p 0:35:40 } +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1612/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 6.67715e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65198 samples/s/p 0:35:41 } +2024-07-30 05:34:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1614/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.659913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:47,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65889 samples/s/p 0:35:36 } +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1616/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.64269e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66135 samples/s/p 0:35:32 } +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1618/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.6254944e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65943 samples/s/p 0:35:30 } +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1620/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 6.608319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66191 samples/s/p 0:35:26 } +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1622/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 6.591165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.66116 samples/s/p 0:35:23 } +2024-07-30 05:35:01,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1624/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.574032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:01,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.65848 samples/s/p 0:35:22 } +2024-07-30 05:35:04,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1626/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.55691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:04,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.65724 samples/s/p 0:35:19 } +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1628/ 3125], loss: 0.344, per_step_time: 1419ms, lr: 6.5398183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.63565 samples/s/p 0:35:25 } +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1630/ 3125], loss: 0.373, per_step_time: 1417ms, lr: 6.5227505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.64309 samples/s/p 0:35:19 } +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1632/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 6.505698e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66012 samples/s/p 0:35:10 } +2024-07-30 05:35:15,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1634/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.488666e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:15,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65896 samples/s/p 0:35:07 } +2024-07-30 05:35:18,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1636/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.471661e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:18,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65926 samples/s/p 0:35:04 } +2024-07-30 05:35:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1638/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 6.4546646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:21,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66072 samples/s/p 0:35:01 } +2024-07-30 05:35:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1640/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.4376917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65920 samples/s/p 0:34:59 } +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1642/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 6.420746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66062 samples/s/p 0:34:55 } +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1644/ 3125], loss: 0.177, per_step_time: 1415ms, lr: 6.4038187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65273 samples/s/p 0:34:55 } +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1646/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.386912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66163 samples/s/p 0:34:49 } +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1648/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.3700315e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65975 samples/s/p 0:34:47 } +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1650/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.3531667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.65891 samples/s/p 0:34:45 } +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1652/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 6.336322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66125 samples/s/p 0:34:41 } +2024-07-30 05:35:43,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1654/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 6.319502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:43,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66202 samples/s/p 0:34:38 } +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1656/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 6.3026965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66250 samples/s/p 0:34:35 } +2024-07-30 05:35:49,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1658/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 6.285912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:49,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65779 samples/s/p 0:34:34 } +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1660/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 6.269154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66222 samples/s/p 0:34:29 } +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1662/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.2524106e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66089 samples/s/p 0:34:27 } +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1664/ 3125], loss: 0.147, per_step_time: 1415ms, lr: 6.2356946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65190 samples/s/p 0:34:27 } +2024-07-30 05:36:00,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1666/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 6.2189963e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:00,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66173 samples/s/p 0:34:21 } +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1668/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.202322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65812 samples/s/p 0:34:20 } +2024-07-30 05:36:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1670/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 6.1856593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:06,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65719 samples/s/p 0:34:17 } +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1672/ 3125], loss: 0.371, per_step_time: 1414ms, lr: 6.169027e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65585 samples/s/p 0:34:15 } +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1674/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.152415e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65701 samples/s/p 0:34:11 } +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1676/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 6.135824e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65857 samples/s/p 0:34:08 } +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1678/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 6.119251e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66108 samples/s/p 0:34:04 } +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1680/ 3125], loss: 0.404, per_step_time: 1412ms, lr: 6.1026986e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66178 samples/s/p 0:34:01 } +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1682/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.0861674e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:23,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.65822 samples/s/p 0:34:00 } +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1684/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.069654e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66015 samples/s/p 0:33:56 } +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1686/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.053165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66062 samples/s/p 0:33:53 } +2024-07-30 05:36:32,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1688/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 6.036699e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:32,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66188 samples/s/p 0:33:50 } +2024-07-30 05:36:34,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1690/ 3125], loss: 0.472, per_step_time: 1412ms, lr: 6.0202535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66240 samples/s/p 0:33:47 } +2024-07-30 05:36:37,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1692/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 6.003827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.65973 samples/s/p 0:33:45 } +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1694/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9874264e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66057 samples/s/p 0:33:42 } +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1696/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 5.971044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:43,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66209 samples/s/p 0:33:39 } +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1698/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 5.9546767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66011 samples/s/p 0:33:36 } +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1700/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 5.938336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:49,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65845 samples/s/p 0:33:34 } +2024-07-30 05:36:51,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1702/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 5.922016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:51,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65936 samples/s/p 0:33:31 } +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1704/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 5.9057203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65869 samples/s/p 0:33:28 } +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1706/ 3125], loss: 0.215, per_step_time: 1415ms, lr: 5.8894364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65349 samples/s/p 0:33:27 } +2024-07-30 05:37:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1708/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 5.8731825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:00,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65976 samples/s/p 0:33:22 } +2024-07-30 05:37:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1710/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.856946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65917 samples/s/p 0:33:20 } +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1712/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.8407306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65963 samples/s/p 0:33:17 } +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1714/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.824533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65930 samples/s/p 0:33:14 } +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1716/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 5.8083623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:11,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65440 samples/s/p 0:33:13 } +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1718/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 5.792209e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65555 samples/s/p 0:33:10 } +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1720/ 3125], loss: 0.420, per_step_time: 1414ms, lr: 5.7760803e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65762 samples/s/p 0:33:06 } +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1722/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 5.759972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65742 samples/s/p 0:33:03 } +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1724/ 3125], loss: 0.136, per_step_time: 1415ms, lr: 5.7438876e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65363 samples/s/p 0:33:02 } +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1726/ 3125], loss: 0.655, per_step_time: 1415ms, lr: 5.7278123e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65262 samples/s/p 0:32:59 } +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1728/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.71177e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66091 samples/s/p 0:32:54 } +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1730/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6957424e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66006 samples/s/p 0:32:51 } +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1732/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6797353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66073 samples/s/p 0:32:48 } +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1734/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.6637555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.65966 samples/s/p 0:32:46 } +2024-07-30 05:37:40,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1736/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 5.647793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:40,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66193 samples/s/p 0:32:42 } +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1738/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.631855e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66059 samples/s/p 0:32:40 } +2024-07-30 05:37:45,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1740/ 3125], loss: 0.575, per_step_time: 1413ms, lr: 5.6159377e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66163 samples/s/p 0:32:37 } +2024-07-30 05:37:48,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1742/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.600035e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:48,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.65987 samples/s/p 0:32:34 } +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1744/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.5841593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66176 samples/s/p 0:32:31 } +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1746/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 5.5683046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66270 samples/s/p 0:32:28 } +2024-07-30 05:37:57,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1748/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 5.5524737e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:57,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.65998 samples/s/p 0:32:26 } +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 5.536655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.65499 samples/s/p 0:32:25 } +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1752/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 5.5208653e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66147 samples/s/p 0:32:20 } +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1754/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 5.505097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66167 samples/s/p 0:32:17 } +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1756/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.4893405e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66024 samples/s/p 0:32:14 } +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1758/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4736165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65922 samples/s/p 0:32:12 } +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1760/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.457908e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66137 samples/s/p 0:32:08 } +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1762/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 5.442223e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65759 samples/s/p 0:32:07 } +2024-07-30 05:38:19,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1764/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.4265615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:19,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65959 samples/s/p 0:32:03 } +2024-07-30 05:38:22,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1766/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 5.4109216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:22,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65958 samples/s/p 0:32:00 } +2024-07-30 05:38:25,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1768/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.395296e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66123 samples/s/p 0:31:57 } +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1770/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 5.379692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66050 samples/s/p 0:31:55 } +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1772/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.364117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66088 samples/s/p 0:31:52 } +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1774/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 5.3485513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65724 samples/s/p 0:31:50 } +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1776/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.333021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66126 samples/s/p 0:31:46 } +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1778/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 5.317503e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65904 samples/s/p 0:31:44 } +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1780/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 5.302012e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65722 samples/s/p 0:31:41 } +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1782/ 3125], loss: 0.191, per_step_time: 1415ms, lr: 5.2865414e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:45,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65252 samples/s/p 0:31:40 } +2024-07-30 05:38:48,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1784/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 5.271089e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66197 samples/s/p 0:31:34 } +2024-07-30 05:38:50,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1786/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.2556544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:50,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66159 samples/s/p 0:31:32 } +2024-07-30 05:38:53,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1788/ 3125], loss: 0.179, per_step_time: 1415ms, lr: 5.240249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65314 samples/s/p 0:31:32 } +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1790/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 5.2248623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66014 samples/s/p 0:31:26 } +2024-07-30 05:38:59,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1792/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 5.2094964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:59,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66078 samples/s/p 0:31:23 } +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1794/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 5.194148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65986 samples/s/p 0:31:21 } +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1796/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 5.178827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65758 samples/s/p 0:31:19 } +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1798/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.1635266e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66074 samples/s/p 0:31:15 } +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1800/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 5.1482436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65783 samples/s/p 0:31:13 } +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1802/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 5.132985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65706 samples/s/p 0:31:10 } +2024-07-30 05:39:16,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1804/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 5.11775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:16,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.66043 samples/s/p 0:31:06 } +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1806/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.102533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65450 samples/s/p 0:31:06 } +2024-07-30 05:39:22,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1808/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.08734e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:22,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65813 samples/s/p 0:31:02 } +2024-07-30 05:39:24,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1810/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.072167e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:24,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65941 samples/s/p 0:30:58 } +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1812/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.057019e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65952 samples/s/p 0:30:55 } +2024-07-30 05:39:30,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1814/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 5.0418885e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:30,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65479 samples/s/p 0:30:54 } +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1816/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 5.0267784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65661 samples/s/p 0:30:51 } +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1818/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 5.0116836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65525 samples/s/p 0:30:48 } +2024-07-30 05:39:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1820/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 4.996621e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:39,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65218 samples/s/p 0:30:47 } +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1822/ 3125], loss: 0.149, per_step_time: 1415ms, lr: 4.981577e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65347 samples/s/p 0:30:43 } +2024-07-30 05:39:44,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1824/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.966557e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:44,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65643 samples/s/p 0:30:40 } +2024-07-30 05:39:47,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1826/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 4.9515575e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:47,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65501 samples/s/p 0:30:37 } +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1828/ 3125], loss: 0.129, per_step_time: 1415ms, lr: 4.936573e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65181 samples/s/p 0:30:35 } +2024-07-30 05:39:53,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1830/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 4.921615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:53,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65440 samples/s/p 0:30:32 } +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1832/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 4.906681e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65414 samples/s/p 0:30:29 } +2024-07-30 05:39:58,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1834/ 3125], loss: 0.434, per_step_time: 1414ms, lr: 4.891765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:58,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65445 samples/s/p 0:30:26 } +2024-07-30 05:40:01,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1836/ 3125], loss: 0.215, per_step_time: 1415ms, lr: 4.8768726e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:01,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65335 samples/s/p 0:30:24 } +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1838/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.8619955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65319 samples/s/p 0:30:21 } +2024-07-30 05:40:07,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1840/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 4.847148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:07,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65576 samples/s/p 0:30:17 } +2024-07-30 05:40:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1842/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 4.8323153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65537 samples/s/p 0:30:14 } +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1844/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 4.8175065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:13,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65539 samples/s/p 0:30:12 } +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1846/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 4.802728e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66136 samples/s/p 0:30:07 } +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1848/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.7879604e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66066 samples/s/p 0:30:04 } +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1850/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7732203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66016 samples/s/p 0:30:02 } +2024-07-30 05:40:24,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1852/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 4.758501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:24,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.65956 samples/s/p 0:29:59 } +2024-07-30 05:40:27,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1854/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 4.7438024e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:27,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66133 samples/s/p 0:29:56 } +2024-07-30 05:40:30,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1856/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.7291277e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.66121 samples/s/p 0:29:53 } +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1858/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.714465e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65669 samples/s/p 0:29:51 } +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1860/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 4.699832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.66037 samples/s/p 0:29:47 } +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1862/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 4.685214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65784 samples/s/p 0:29:45 } +2024-07-30 05:40:41,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1864/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 4.670626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:41,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65758 samples/s/p 0:29:43 } +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1866/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 4.6560555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65675 samples/s/p 0:29:40 } +2024-07-30 05:40:47,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1868/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.641509e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:47,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65800 samples/s/p 0:29:37 } +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1870/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.6269832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65799 samples/s/p 0:29:34 } +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1872/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 4.6124725e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.66077 samples/s/p 0:29:30 } +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1874/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 4.5979917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66108 samples/s/p 0:29:27 } +2024-07-30 05:40:58,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1876/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.5835316e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:58,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66057 samples/s/p 0:29:25 } +2024-07-30 05:41:01,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1878/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 4.5690953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66081 samples/s/p 0:29:22 } +2024-07-30 05:41:04,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1880/ 3125], loss: 0.405, per_step_time: 1414ms, lr: 4.554677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:04,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65722 samples/s/p 0:29:20 } +2024-07-30 05:41:07,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1882/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.5402763e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:07,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65912 samples/s/p 0:29:17 } +2024-07-30 05:41:09,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1884/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 4.5259057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:09,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65628 samples/s/p 0:29:15 } +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1886/ 3125], loss: 0.212, per_step_time: 1415ms, lr: 4.51155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65359 samples/s/p 0:29:13 } +2024-07-30 05:41:15,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1888/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.497218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65600 samples/s/p 0:29:09 } +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1890/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 4.482907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.66090 samples/s/p 0:29:05 } +2024-07-30 05:41:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1892/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 4.4686226e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:21,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65973 samples/s/p 0:29:02 } +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1894/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 4.4543594e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65750 samples/s/p 0:29:00 } +2024-07-30 05:41:26,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1896/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 4.440114e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65996 samples/s/p 0:28:57 } +2024-07-30 05:41:29,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1898/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.4258923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:29,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65890 samples/s/p 0:28:54 } +2024-07-30 05:41:32,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1900/ 3125], loss: 0.282, per_step_time: 1425ms, lr: 4.4116854e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:32,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.61396 samples/s/p 0:29:05 } +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1902/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 4.3975083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66074 samples/s/p 0:28:48 } +2024-07-30 05:41:38,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1904/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 4.3833552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:38,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.65983 samples/s/p 0:28:45 } +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1906/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.369217e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66085 samples/s/p 0:28:42 } +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1908/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.3550997e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66049 samples/s/p 0:28:39 } +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1910/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 4.3410122e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:46,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66134 samples/s/p 0:28:36 } +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1912/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.3269455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66083 samples/s/p 0:28:34 } +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1914/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.3128907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66129 samples/s/p 0:28:31 } +2024-07-30 05:41:55,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1916/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 4.2988657e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66012 samples/s/p 0:28:28 } +2024-07-30 05:41:58,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1918/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 4.2848615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:58,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66114 samples/s/p 0:28:25 } +2024-07-30 05:42:00,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1920/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 4.2708783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:00,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66147 samples/s/p 0:28:22 } +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1922/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 4.2569218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66061 samples/s/p 0:28:20 } +2024-07-30 05:42:06,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1924/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 4.2429835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66100 samples/s/p 0:28:17 } +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1926/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.2290628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65811 samples/s/p 0:28:15 } +2024-07-30 05:42:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1928/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 4.215169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:12,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66048 samples/s/p 0:28:11 } +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1930/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 4.20129e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66239 samples/s/p 0:28:08 } +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1932/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.1874407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66125 samples/s/p 0:28:05 } +2024-07-30 05:42:20,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1934/ 3125], loss: 0.110, per_step_time: 1414ms, lr: 4.1736124e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:20,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65645 samples/s/p 0:28:04 } +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1936/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 4.159802e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65816 samples/s/p 0:28:01 } +2024-07-30 05:42:26,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1938/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 4.1460186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65799 samples/s/p 0:27:58 } +2024-07-30 05:42:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1940/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 4.132256e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66137 samples/s/p 0:27:54 } +2024-07-30 05:42:32,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1942/ 3125], loss: 0.137, per_step_time: 1416ms, lr: 4.118514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:32,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.64927 samples/s/p 0:27:55 } +2024-07-30 05:42:34,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1944/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 4.10479e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:34,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65736 samples/s/p 0:27:50 } +2024-07-30 05:42:37,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1946/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.091096e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:37,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65934 samples/s/p 0:27:46 } +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1948/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.0774196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66046 samples/s/p 0:27:43 } +2024-07-30 05:42:43,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1950/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 4.063761e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65785 samples/s/p 0:27:41 } +2024-07-30 05:42:46,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1952/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.0501297e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:46,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65944 samples/s/p 0:27:38 } +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1954/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 4.0365188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66067 samples/s/p 0:27:34 } +2024-07-30 05:42:51,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1956/ 3125], loss: 0.320, per_step_time: 1412ms, lr: 4.0229318e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:51,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66185 samples/s/p 0:27:31 } +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1958/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 4.00936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66185 samples/s/p 0:27:28 } +2024-07-30 05:42:57,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1960/ 3125], loss: 0.147, per_step_time: 1418ms, lr: 3.995821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:57,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.63831 samples/s/p 0:27:32 } +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1962/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.9822964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.65957 samples/s/p 0:27:23 } +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1964/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 3.968799e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66330 samples/s/p 0:27:20 } +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1966/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.9553166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.65929 samples/s/p 0:27:18 } +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1968/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 3.9418606e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65958 samples/s/p 0:27:15 } +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1970/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.9284288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65969 samples/s/p 0:27:12 } +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1972/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 3.9150117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65965 samples/s/p 0:27:09 } +2024-07-30 05:43:17,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1974/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.9016186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:17,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65275 samples/s/p 0:27:08 } +2024-07-30 05:43:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1976/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 3.888252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65936 samples/s/p 0:27:04 } +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1978/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 3.874904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65944 samples/s/p 0:27:01 } +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1980/ 3125], loss: 0.322, per_step_time: 1412ms, lr: 3.8615792e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66197 samples/s/p 0:26:57 } +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1982/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 3.8482784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65666 samples/s/p 0:26:56 } +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1984/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 3.8349955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65981 samples/s/p 0:26:52 } +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1986/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 3.8217425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.64842 samples/s/p 0:26:53 } +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1988/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.8085014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66086 samples/s/p 0:26:46 } +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1990/ 3125], loss: 0.203, per_step_time: 1415ms, lr: 3.795287e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65331 samples/s/p 0:26:46 } +2024-07-30 05:43:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1992/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 3.7820934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:42,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66331 samples/s/p 0:26:40 } +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1994/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7689267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65819 samples/s/p 0:26:39 } +2024-07-30 05:43:48,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1996/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.755772e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65911 samples/s/p 0:26:36 } +2024-07-30 05:43:51,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1998/ 3125], loss: 0.155, per_step_time: 1414ms, lr: 3.7426472e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:51,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65698 samples/s/p 0:26:33 } +2024-07-30 05:43:54,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2000/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.729546e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:54,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65753 samples/s/p 0:26:30 } +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2002/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7164597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65651 samples/s/p 0:26:28 } +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2004/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7034005e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.66097 samples/s/p 0:26:24 } +2024-07-30 05:44:02,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2006/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.690362e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:02,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65857 samples/s/p 0:26:22 } +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2008/ 3125], loss: 0.410, per_step_time: 1412ms, lr: 3.677347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66260 samples/s/p 0:26:18 } +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2010/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 3.6643564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66080 samples/s/p 0:26:15 } +2024-07-30 05:44:11,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2012/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.6513865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65796 samples/s/p 0:26:13 } +2024-07-30 05:44:14,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2014/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.6384372e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:14,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65971 samples/s/p 0:26:10 } +2024-07-30 05:44:16,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2016/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 3.625506e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66275 samples/s/p 0:26:06 } +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2018/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.6126016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.65827 samples/s/p 0:26:05 } +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2020/ 3125], loss: 0.414, per_step_time: 1412ms, lr: 3.599718e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66172 samples/s/p 0:26:01 } +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2022/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 3.5868555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66040 samples/s/p 0:25:58 } +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2024/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 3.5740166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66155 samples/s/p 0:25:55 } +2024-07-30 05:44:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2026/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.5612015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66028 samples/s/p 0:25:53 } +2024-07-30 05:44:33,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2028/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.5484044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:33,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65875 samples/s/p 0:25:50 } +2024-07-30 05:44:36,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2030/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.535631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65935 samples/s/p 0:25:47 } +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2032/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 3.5228848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65981 samples/s/p 0:25:44 } +2024-07-30 05:44:42,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2034/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.5101561e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:42,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66015 samples/s/p 0:25:42 } +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2036/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.4974514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65988 samples/s/p 0:25:39 } +2024-07-30 05:44:48,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2038/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.4847704e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:48,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65864 samples/s/p 0:25:36 } +2024-07-30 05:44:50,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2040/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.4721046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:50,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65942 samples/s/p 0:25:33 } +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2042/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 3.4594655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65663 samples/s/p 0:25:31 } +2024-07-30 05:44:56,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2044/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 3.446847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65765 samples/s/p 0:25:28 } +2024-07-30 05:44:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2046/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 3.4342526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65525 samples/s/p 0:25:26 } +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2048/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 3.421682e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.66236 samples/s/p 0:25:21 } +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2050/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 3.4091323e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65843 samples/s/p 0:25:19 } +2024-07-30 05:45:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2052/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.3966063e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:07,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65934 samples/s/p 0:25:16 } +2024-07-30 05:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2054/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 3.3841013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65960 samples/s/p 0:25:13 } +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2056/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.3716202e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.66060 samples/s/p 0:25:10 } +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2058/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 3.3591598e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65723 samples/s/p 0:25:08 } +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2060/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 3.3467143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65912 samples/s/p 0:25:05 } +2024-07-30 05:45:22,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2062/ 3125], loss: 0.276, per_step_time: 1418ms, lr: 3.3342985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:22,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.63995 samples/s/p 0:25:07 } +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2064/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 3.321907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66186 samples/s/p 0:24:59 } +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2066/ 3125], loss: 0.146, per_step_time: 1412ms, lr: 3.30953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66177 samples/s/p 0:24:56 } +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2068/ 3125], loss: 0.238, per_step_time: 1417ms, lr: 3.297183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64429 samples/s/p 0:24:58 } +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2070/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 3.2848595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66018 samples/s/p 0:24:51 } +2024-07-30 05:45:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 3.272554e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:36,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65800 samples/s/p 0:24:48 } +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2074/ 3125], loss: 0.392, per_step_time: 1415ms, lr: 3.2602668e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.64996 samples/s/p 0:24:48 } +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2076/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 3.248009e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65741 samples/s/p 0:24:43 } +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2078/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.2357693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65751 samples/s/p 0:24:40 } +2024-07-30 05:45:47,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2080/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 3.2235562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65955 samples/s/p 0:24:37 } +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2082/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.211364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66064 samples/s/p 0:24:34 } +2024-07-30 05:45:53,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2084/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 3.19919e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:53,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65953 samples/s/p 0:24:31 } +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2086/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.1870425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66052 samples/s/p 0:24:28 } +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2088/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 3.17491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66075 samples/s/p 0:24:25 } +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2090/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 3.1628102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66192 samples/s/p 0:24:22 } +2024-07-30 05:46:04,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2092/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1507284e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:04,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65867 samples/s/p 0:24:20 } +2024-07-30 05:46:07,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2094/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 3.1386702e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65607 samples/s/p 0:24:18 } +2024-07-30 05:46:10,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2096/ 3125], loss: 0.305, per_step_time: 1412ms, lr: 3.126633e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:10,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66173 samples/s/p 0:24:13 } +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2098/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1146197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65970 samples/s/p 0:24:11 } +2024-07-30 05:46:15,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2100/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 3.1026272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:15,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65792 samples/s/p 0:24:09 } +2024-07-30 05:46:18,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2102/ 3125], loss: 0.392, per_step_time: 1414ms, lr: 3.0906529e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:18,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65710 samples/s/p 0:24:06 } +2024-07-30 05:46:21,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2104/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.078708e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:21,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65969 samples/s/p 0:24:03 } +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2106/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.066784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65990 samples/s/p 0:24:00 } +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2108/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 3.0548782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65895 samples/s/p 0:23:57 } +2024-07-30 05:46:30,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2110/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.0429987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:30,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66015 samples/s/p 0:23:54 } +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2112/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.0311435e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65881 samples/s/p 0:23:52 } +2024-07-30 05:46:35,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2114/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.019309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:35,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65936 samples/s/p 0:23:49 } +2024-07-30 05:46:38,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2116/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 3.0074892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:38,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66141 samples/s/p 0:23:45 } +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2118/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.9957056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65803 samples/s/p 0:23:43 } +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2120/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 2.9839336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65716 samples/s/p 0:23:41 } +2024-07-30 05:46:47,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2122/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.9721915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:47,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65833 samples/s/p 0:23:38 } +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2124/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 2.9604672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66230 samples/s/p 0:23:34 } +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2126/ 3125], loss: 0.245, per_step_time: 1412ms, lr: 2.94877e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66201 samples/s/p 0:23:31 } +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2128/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 2.9370904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65945 samples/s/p 0:23:29 } +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2130/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 2.9254346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66160 samples/s/p 0:23:25 } +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2132/ 3125], loss: 0.417, per_step_time: 1414ms, lr: 2.9138e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65674 samples/s/p 0:23:24 } +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2134/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 2.9021888e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66006 samples/s/p 0:23:20 } +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2136/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.8905987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65846 samples/s/p 0:23:18 } +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2138/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 2.8790353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65851 samples/s/p 0:23:15 } +2024-07-30 05:47:12,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2140/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 2.8674899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65833 samples/s/p 0:23:12 } +2024-07-30 05:47:15,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2142/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 2.8559742e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:15,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65770 samples/s/p 0:23:09 } +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2144/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.8444765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65774 samples/s/p 0:23:07 } +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 2.8329998e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65897 samples/s/p 0:23:03 } +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2148/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 2.8215436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65758 samples/s/p 0:23:01 } +2024-07-30 05:47:26,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2150/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.8101147e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65979 samples/s/p 0:22:58 } +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2152/ 3125], loss: 0.418, per_step_time: 2169ms, lr: 2.7987033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 3.68803 samples/s/p 0:35:10 } +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2154/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.7873187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66208 samples/s/p 0:22:51 } +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2156/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 2.7759552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65949 samples/s/p 0:22:49 } +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2158/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 2.7646155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65911 samples/s/p 0:22:47 } +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2160/ 3125], loss: 0.600, per_step_time: 1413ms, lr: 2.7532965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65949 samples/s/p 0:22:44 } +2024-07-30 05:48:17,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2162/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.7420015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:17,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65775 samples/s/p 0:22:41 } +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2164/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 2.7307271e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65633 samples/s/p 0:22:39 } +2024-07-30 05:48:23,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2166/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.7194767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65984 samples/s/p 0:22:35 } +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2168/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 2.7082532e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65496 samples/s/p 0:22:33 } +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2170/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6970474e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65632 samples/s/p 0:22:30 } +2024-07-30 05:48:31,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2172/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 2.6858626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:31,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65783 samples/s/p 0:22:27 } +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2174/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 2.6747017e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66055 samples/s/p 0:22:24 } +2024-07-30 05:48:37,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2176/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.6635615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:37,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66092 samples/s/p 0:22:21 } +2024-07-30 05:48:40,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2178/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.6524512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:40,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65914 samples/s/p 0:22:18 } +2024-07-30 05:48:42,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2180/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.641356e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:42,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66063 samples/s/p 0:22:15 } +2024-07-30 05:48:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2182/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.6302874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65945 samples/s/p 0:22:12 } +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2184/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 2.6192455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65955 samples/s/p 0:22:10 } +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2186/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 2.6082188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65959 samples/s/p 0:22:07 } +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2188/ 3125], loss: 0.160, per_step_time: 1415ms, lr: 2.5972128e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65301 samples/s/p 0:22:06 } +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2190/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 2.5862366e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65899 samples/s/p 0:22:01 } +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2192/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 2.5752811e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.66114 samples/s/p 0:21:58 } +2024-07-30 05:49:02,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2194/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 2.5643467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:02,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66025 samples/s/p 0:21:55 } +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2196/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 2.553433e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66179 samples/s/p 0:21:52 } +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2198/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 2.5425493e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:08,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65510 samples/s/p 0:21:51 } +2024-07-30 05:49:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2200/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.5316834e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65715 samples/s/p 0:21:48 } +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2202/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.5208382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65868 samples/s/p 0:21:44 } +2024-07-30 05:49:16,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2204/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 2.5100172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66016 samples/s/p 0:21:41 } +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.4992198e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66073 samples/s/p 0:21:38 } +2024-07-30 05:49:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2208/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 2.4884463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:22,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65975 samples/s/p 0:21:36 } +2024-07-30 05:49:25,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2210/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.4776935e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:25,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65980 samples/s/p 0:21:33 } +2024-07-30 05:49:28,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2212/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.4669646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:28,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.66025 samples/s/p 0:21:30 } +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2214/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4562596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65874 samples/s/p 0:21:27 } +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2216/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 2.4455724e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:33,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65648 samples/s/p 0:21:25 } +2024-07-30 05:49:36,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2218/ 3125], loss: 0.370, per_step_time: 1415ms, lr: 2.4349092e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:36,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65306 samples/s/p 0:21:23 } +2024-07-30 05:49:39,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2220/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.424267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:39,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.66162 samples/s/p 0:21:18 } +2024-07-30 05:49:42,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2222/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.4136511e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:42,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65495 samples/s/p 0:21:17 } +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2224/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 2.4030626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65975 samples/s/p 0:21:13 } +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2226/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3924918e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66002 samples/s/p 0:21:10 } +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2228/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 2.3819446e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66076 samples/s/p 0:21:07 } +2024-07-30 05:49:53,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2230/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.3714185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:53,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66240 samples/s/p 0:21:04 } +2024-07-30 05:49:56,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2232/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 2.3609131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:56,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66127 samples/s/p 0:21:01 } +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2234/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 2.3504346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66220 samples/s/p 0:20:58 } +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2236/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 2.339977e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66291 samples/s/p 0:20:55 } +2024-07-30 05:50:05,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2238/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.3295432e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.65800 samples/s/p 0:20:54 } +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2240/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 2.3191302e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66107 samples/s/p 0:20:50 } +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2242/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.3087412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:10,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65816 samples/s/p 0:20:48 } +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2244/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.298379e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66013 samples/s/p 0:20:45 } +2024-07-30 05:50:16,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2246/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 2.2880344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:16,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65963 samples/s/p 0:20:42 } +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2248/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.277714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66022 samples/s/p 0:20:39 } +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2250/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.2674172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:22,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65880 samples/s/p 0:20:37 } +2024-07-30 05:50:24,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2252/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.2571385e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:24,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65947 samples/s/p 0:20:34 } +2024-07-30 05:50:27,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2254/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.2468895e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65735 samples/s/p 0:20:31 } +2024-07-30 05:50:30,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2256/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 2.2366582e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:30,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.66126 samples/s/p 0:20:27 } +2024-07-30 05:50:33,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2258/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.226451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:33,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65689 samples/s/p 0:20:26 } +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2260/ 3125], loss: 0.350, per_step_time: 1414ms, lr: 2.2162705e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65646 samples/s/p 0:20:23 } +2024-07-30 05:50:39,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2262/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 2.2061108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:39,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65800 samples/s/p 0:20:20 } +2024-07-30 05:50:41,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2264/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.1959691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:41,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66098 samples/s/p 0:20:16 } +2024-07-30 05:50:44,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2266/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.1858513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66136 samples/s/p 0:20:13 } +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2268/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 2.1757631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65831 samples/s/p 0:20:11 } +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2270/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 2.165693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65953 samples/s/p 0:20:08 } +2024-07-30 05:50:53,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2272/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 2.1556467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:53,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65605 samples/s/p 0:20:06 } +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2274/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.145627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65845 samples/s/p 0:20:03 } +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2276/ 3125], loss: 0.102, per_step_time: 1414ms, lr: 2.1356195e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65732 samples/s/p 0:20:00 } +2024-07-30 05:51:01,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2278/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 2.1256416e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:01,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65840 samples/s/p 0:19:57 } +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2280/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 2.1156906e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65758 samples/s/p 0:19:54 } +2024-07-30 05:51:07,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2282/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.1057605e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:07,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65236 samples/s/p 0:19:53 } +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2284/ 3125], loss: 0.233, per_step_time: 1415ms, lr: 2.0958453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65257 samples/s/p 0:19:50 } +2024-07-30 05:51:13,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2286/ 3125], loss: 0.250, per_step_time: 1414ms, lr: 2.0859599e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:13,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65524 samples/s/p 0:19:46 } +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2288/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.0760953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65940 samples/s/p 0:19:43 } +2024-07-30 05:51:18,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2290/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.0662516e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:18,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65851 samples/s/p 0:19:40 } +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2292/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 2.0564347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65839 samples/s/p 0:19:37 } +2024-07-30 05:51:24,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2294/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 2.0466386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:24,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.66137 samples/s/p 0:19:34 } +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2296/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.0368695e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.65028 samples/s/p 0:19:33 } +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2298/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 2.0271182e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66187 samples/s/p 0:19:28 } +2024-07-30 05:51:32,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2300/ 3125], loss: 0.330, per_step_time: 1412ms, lr: 2.0173967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:32,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66220 samples/s/p 0:19:25 } +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2302/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.007693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.65836 samples/s/p 0:19:23 } +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2304/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 1.9980102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66121 samples/s/p 0:19:20 } +2024-07-30 05:51:41,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2306/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 1.9883512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66133 samples/s/p 0:19:17 } +2024-07-30 05:51:44,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2308/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 1.9787161e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:44,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66172 samples/s/p 0:19:14 } +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2310/ 3125], loss: 0.457, per_step_time: 1412ms, lr: 1.969102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66174 samples/s/p 0:19:11 } +2024-07-30 05:51:49,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2312/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 1.9595146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.65975 samples/s/p 0:19:09 } +2024-07-30 05:51:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2314/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.949951e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66092 samples/s/p 0:19:06 } +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2316/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.9404054e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.66051 samples/s/p 0:19:03 } +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2318/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.9308835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65865 samples/s/p 0:19:00 } +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2320/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9213884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65784 samples/s/p 0:18:58 } +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2322/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.9119173e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65461 samples/s/p 0:18:56 } +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2324/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.902464e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65986 samples/s/p 0:18:52 } +2024-07-30 05:52:09,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2326/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.8930375e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:09,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66015 samples/s/p 0:18:49 } +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2328/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 1.8836319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66114 samples/s/p 0:18:46 } +2024-07-30 05:52:15,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2330/ 3125], loss: 0.352, per_step_time: 1412ms, lr: 1.8742502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:15,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66193 samples/s/p 0:18:43 } +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2332/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.8648892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65911 samples/s/p 0:18:41 } +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2334/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.8555491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:21,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65960 samples/s/p 0:18:38 } +2024-07-30 05:52:23,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2336/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.8462389e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:23,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65924 samples/s/p 0:18:35 } +2024-07-30 05:52:26,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2338/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 1.8369495e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:26,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65732 samples/s/p 0:18:32 } +2024-07-30 05:52:29,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2340/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 1.827684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:29,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.66092 samples/s/p 0:18:29 } +2024-07-30 05:52:32,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2342/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 1.8184393e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:32,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65462 samples/s/p 0:18:27 } +2024-07-30 05:52:35,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2344/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.8092155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65808 samples/s/p 0:18:24 } +2024-07-30 05:52:38,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2346/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 1.8000215e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65942 samples/s/p 0:18:21 } +2024-07-30 05:52:40,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2348/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 1.7908394e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:40,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65584 samples/s/p 0:18:19 } +2024-07-30 05:52:43,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2350/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 1.78169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:43,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65727 samples/s/p 0:18:15 } +2024-07-30 05:52:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2352/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.7725617e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65910 samples/s/p 0:18:12 } +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2354/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 1.7634571e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65985 samples/s/p 0:18:09 } +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2356/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.7543672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65960 samples/s/p 0:18:07 } +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2358/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 1.7453104e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65670 samples/s/p 0:18:04 } +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2360/ 3125], loss: 0.342, per_step_time: 1414ms, lr: 1.7362743e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65758 samples/s/p 0:18:01 } +2024-07-30 05:53:00,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2362/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 1.7272562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:00,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65628 samples/s/p 0:17:59 } +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2364/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 1.7182677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65866 samples/s/p 0:17:55 } +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2366/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.7093032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66069 samples/s/p 0:17:52 } +2024-07-30 05:53:09,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2368/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7003566e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:09,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66007 samples/s/p 0:17:49 } +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2370/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 1.6914368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66195 samples/s/p 0:17:46 } +2024-07-30 05:53:14,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2372/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6825408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:14,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.66109 samples/s/p 0:17:44 } +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2374/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.6736627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.65907 samples/s/p 0:17:41 } +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2376/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.6648083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.66179 samples/s/p 0:17:38 } +2024-07-30 05:53:23,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2378/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.655975e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:23,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.65999 samples/s/p 0:17:35 } +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2380/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 1.6471714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66060 samples/s/p 0:17:32 } +2024-07-30 05:53:29,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2382/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.6383856e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:29,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66161 samples/s/p 0:17:29 } +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2384/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.6296268e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66110 samples/s/p 0:17:27 } +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2386/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.6208917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65876 samples/s/p 0:17:24 } +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2388/ 3125], loss: 0.043, per_step_time: 1413ms, lr: 1.6121744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65971 samples/s/p 0:17:21 } +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2390/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 1.603484e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65919 samples/s/p 0:17:19 } +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2392/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.5948176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65686 samples/s/p 0:17:16 } +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2394/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 1.586169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65707 samples/s/p 0:17:13 } +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2396/ 3125], loss: 0.369, per_step_time: 1414ms, lr: 1.5775501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65751 samples/s/p 0:17:10 } +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2398/ 3125], loss: 0.399, per_step_time: 1414ms, lr: 1.5689491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65656 samples/s/p 0:17:08 } +2024-07-30 05:53:54,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2400/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.560378e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:54,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.66118 samples/s/p 0:17:04 } +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2402/ 3125], loss: 0.127, per_step_time: 1414ms, lr: 1.5518218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65752 samples/s/p 0:17:02 } +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2404/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 1.5432924e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65737 samples/s/p 0:16:59 } +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2406/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 1.5347868e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65731 samples/s/p 0:16:56 } +2024-07-30 05:54:05,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2408/ 3125], loss: 0.337, per_step_time: 1415ms, lr: 1.5263021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65363 samples/s/p 0:16:54 } +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2410/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 1.5178442e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65667 samples/s/p 0:16:51 } +2024-07-30 05:54:11,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2412/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.509407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:11,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65788 samples/s/p 0:16:48 } +2024-07-30 05:54:14,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2414/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 1.5009999e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:14,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65720 samples/s/p 0:16:45 } +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2416/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 1.4926076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.66046 samples/s/p 0:16:42 } +2024-07-30 05:54:20,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2418/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 1.4842361e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.65912 samples/s/p 0:16:39 } +2024-07-30 05:54:22,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2420/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4758915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66093 samples/s/p 0:16:36 } +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2422/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.4675706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66036 samples/s/p 0:16:33 } +2024-07-30 05:54:28,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2424/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4592736e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:28,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66018 samples/s/p 0:16:30 } +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2426/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 1.4509976e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66203 samples/s/p 0:16:27 } +2024-07-30 05:54:34,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2428/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 1.4427512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:34,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66017 samples/s/p 0:16:25 } +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2430/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.4345228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66166 samples/s/p 0:16:22 } +2024-07-30 05:54:39,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2432/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.4263212e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.65914 samples/s/p 0:16:19 } +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2434/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 1.4181346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.65995 samples/s/p 0:16:16 } +2024-07-30 05:54:45,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2436/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4099747e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66080 samples/s/p 0:16:13 } +2024-07-30 05:54:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2438/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.4018386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:48,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66077 samples/s/p 0:16:10 } +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2440/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.3937324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65839 samples/s/p 0:16:08 } +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2442/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.385638e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65863 samples/s/p 0:16:05 } +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2444/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.3775735e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65967 samples/s/p 0:16:02 } +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2446/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.3695359e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65848 samples/s/p 0:15:59 } +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2448/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 1.3615131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65742 samples/s/p 0:15:57 } +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2450/ 3125], loss: 0.194, per_step_time: 1418ms, lr: 1.3535141e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.63905 samples/s/p 0:15:57 } +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2452/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.345545e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65950 samples/s/p 0:15:51 } +2024-07-30 05:55:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2454/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 1.3375967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:11,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65791 samples/s/p 0:15:48 } +2024-07-30 05:55:14,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2456/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 1.3296693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65685 samples/s/p 0:15:46 } +2024-07-30 05:55:16,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2458/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 1.3217628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:16,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65186 samples/s/p 0:15:44 } +2024-07-30 05:55:19,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2460/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.313889e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:19,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66046 samples/s/p 0:15:39 } +2024-07-30 05:55:22,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2462/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 1.3060301e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66109 samples/s/p 0:15:36 } +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2464/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.2981981e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66033 samples/s/p 0:15:34 } +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2466/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 1.290381e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65696 samples/s/p 0:15:31 } +2024-07-30 05:55:31,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2468/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.2825936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:31,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66132 samples/s/p 0:15:28 } +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2470/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.274833e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65891 samples/s/p 0:15:25 } +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2472/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 1.2670934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65582 samples/s/p 0:15:23 } +2024-07-30 05:55:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2474/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 1.2593746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65819 samples/s/p 0:15:20 } +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2476/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 1.2516796e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65768 samples/s/p 0:15:17 } +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2478/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 1.2440115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65998 samples/s/p 0:15:14 } +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2480/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 1.2363672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65830 samples/s/p 0:15:11 } +2024-07-30 05:55:50,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2482/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.2287408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:50,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66053 samples/s/p 0:15:08 } +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2484/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.2211382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65806 samples/s/p 0:15:06 } +2024-07-30 05:55:56,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2486/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 1.2135625e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:56,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66002 samples/s/p 0:15:03 } +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2488/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 1.2060076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66036 samples/s/p 0:15:00 } +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2490/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 1.1984795e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66141 samples/s/p 0:14:57 } +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2492/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 1.1909723e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65983 samples/s/p 0:14:54 } +2024-07-30 05:56:07,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2494/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 1.18348595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:07,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.66006 samples/s/p 0:14:51 } +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2496/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 1.1760235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:10,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65826 samples/s/p 0:14:49 } +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2498/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 1.1685848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.66008 samples/s/p 0:14:46 } +2024-07-30 05:56:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2500/ 3125], loss: 0.334, per_step_time: 1414ms, lr: 1.1611759e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65629 samples/s/p 0:14:43 } +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2502/ 3125], loss: 0.413, per_step_time: 1415ms, lr: 1.153782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.65181 samples/s/p 0:14:41 } +2024-07-30 05:56:22,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2504/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 1.14641786e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66073 samples/s/p 0:14:37 } +2024-07-30 05:56:24,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2506/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 1.13907156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:24,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66193 samples/s/p 0:14:34 } +2024-07-30 05:56:27,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2508/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.1317521e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:27,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66105 samples/s/p 0:14:31 } +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2510/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 1.1244505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.65997 samples/s/p 0:14:29 } +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2512/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.11717874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65671 samples/s/p 0:14:26 } +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2514/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.1099249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65932 samples/s/p 0:14:23 } +2024-07-30 05:56:39,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2516/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 1.1027008e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65695 samples/s/p 0:14:21 } +2024-07-30 05:56:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2518/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 1.0954946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:41,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65291 samples/s/p 0:14:19 } +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2520/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 1.0883152e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.66152 samples/s/p 0:14:14 } +2024-07-30 05:56:47,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2522/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.0811567e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:47,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65909 samples/s/p 0:14:12 } +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2524/ 3125], loss: 0.348, per_step_time: 1412ms, lr: 1.074025e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66192 samples/s/p 0:14:09 } +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2526/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.0669142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66104 samples/s/p 0:14:06 } +2024-07-30 05:56:56,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2528/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.0598272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65843 samples/s/p 0:14:04 } +2024-07-30 05:56:58,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2530/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.0527551e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:58,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66134 samples/s/p 0:14:00 } +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2532/ 3125], loss: 0.062, per_step_time: 1412ms, lr: 1.04571576e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66174 samples/s/p 0:13:57 } +2024-07-30 05:57:04,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2534/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 1.0387033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65567 samples/s/p 0:13:55 } +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2536/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 1.0317057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66242 samples/s/p 0:13:52 } +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2538/ 3125], loss: 0.071, per_step_time: 1415ms, lr: 1.0247349e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65133 samples/s/p 0:13:50 } +2024-07-30 05:57:13,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2540/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.017788e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65829 samples/s/p 0:13:47 } +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2542/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.0108679e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65471 samples/s/p 0:13:44 } +2024-07-30 05:57:18,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2544/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.0039687e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65761 samples/s/p 0:13:41 } +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2546/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 9.9709034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.66256 samples/s/p 0:13:38 } +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2548/ 3125], loss: 0.436, per_step_time: 1414ms, lr: 9.902358e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65726 samples/s/p 0:13:35 } +2024-07-30 05:57:27,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2550/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.834021e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:27,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66030 samples/s/p 0:13:32 } +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2552/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.765982e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.65927 samples/s/p 0:13:29 } +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2554/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.6981225e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66080 samples/s/p 0:13:26 } +2024-07-30 05:57:35,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2556/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.630531e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66057 samples/s/p 0:13:24 } +2024-07-30 05:57:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2558/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.5631776e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.65967 samples/s/p 0:13:21 } +2024-07-30 05:57:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2560/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.4960626e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.66074 samples/s/p 0:13:18 } +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2562/ 3125], loss: 0.318, per_step_time: 1426ms, lr: 9.429186e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.60913 samples/s/p 0:13:22 } +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2564/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.362459e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.66065 samples/s/p 0:13:12 } +2024-07-30 05:57:49,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2566/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.29603e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:49,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.65945 samples/s/p 0:13:10 } +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2568/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.2298386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65638 samples/s/p 0:13:07 } +2024-07-30 05:57:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2570/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.163886e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.66062 samples/s/p 0:13:04 } +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2572/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 9.098202e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65562 samples/s/p 0:13:02 } +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2574/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.032637e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65821 samples/s/p 0:12:59 } +2024-07-30 05:58:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2576/ 3125], loss: 0.447, per_step_time: 1414ms, lr: 8.9674295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:04,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65758 samples/s/p 0:12:56 } +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2578/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.9024006e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66000 samples/s/p 0:12:53 } +2024-07-30 05:58:09,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2580/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.83764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:09,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66071 samples/s/p 0:12:50 } +2024-07-30 05:58:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2582/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 8.7730584e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:12,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65757 samples/s/p 0:12:47 } +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2584/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.708715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65640 samples/s/p 0:12:45 } +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2586/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.64467e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66091 samples/s/p 0:12:41 } +2024-07-30 05:58:21,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2588/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.580774e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66021 samples/s/p 0:12:38 } +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2590/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 8.5171756e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65899 samples/s/p 0:12:36 } +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2592/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 8.453816e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66038 samples/s/p 0:12:33 } +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2594/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 8.390635e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65762 samples/s/p 0:12:30 } +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2596/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 8.327722e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65534 samples/s/p 0:12:28 } +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2598/ 3125], loss: 0.081, per_step_time: 1414ms, lr: 8.265048e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65672 samples/s/p 0:12:25 } +2024-07-30 05:58:38,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2600/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.202642e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66171 samples/s/p 0:12:21 } +2024-07-30 05:58:40,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2602/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.1404444e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65915 samples/s/p 0:12:19 } +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2604/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 8.078426e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66243 samples/s/p 0:12:16 } +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2606/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.0167055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66104 samples/s/p 0:12:13 } +2024-07-30 05:58:49,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2608/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 7.955163e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.65938 samples/s/p 0:12:10 } +2024-07-30 05:58:52,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2610/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 7.893949e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:52,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66117 samples/s/p 0:12:07 } +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2612/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.8329144e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66074 samples/s/p 0:12:04 } +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2614/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.7721474e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66089 samples/s/p 0:12:02 } +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2616/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.7115295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66161 samples/s/p 0:11:59 } +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2618/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.6512094e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65952 samples/s/p 0:11:56 } +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2620/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.591128e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65918 samples/s/p 0:11:53 } +2024-07-30 05:59:09,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2622/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 7.5312556e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65997 samples/s/p 0:11:50 } +2024-07-30 05:59:12,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2624/ 3125], loss: 0.343, per_step_time: 1425ms, lr: 7.47165e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:12,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.61176 samples/s/p 0:11:54 } +2024-07-30 05:59:14,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2626/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 7.4122546e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:14,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65876 samples/s/p 0:11:45 } +2024-07-30 05:59:17,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2628/ 3125], loss: 0.128, per_step_time: 1415ms, lr: 7.353127e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:17,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65231 samples/s/p 0:11:43 } +2024-07-30 05:59:20,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2630/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 7.294178e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:20,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66140 samples/s/p 0:11:39 } +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2632/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 7.235497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66099 samples/s/p 0:11:36 } +2024-07-30 05:59:26,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2634/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 7.177055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65855 samples/s/p 0:11:34 } +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2636/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.118821e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65875 samples/s/p 0:11:31 } +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2638/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 7.0609154e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65736 samples/s/p 0:11:28 } +2024-07-30 05:59:34,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2640/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 7.003158e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:34,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65795 samples/s/p 0:11:25 } +2024-07-30 05:59:37,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2642/ 3125], loss: 0.435, per_step_time: 1415ms, lr: 6.94561e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:37,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65316 samples/s/p 0:11:23 } +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2644/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 6.8883594e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65813 samples/s/p 0:11:20 } +2024-07-30 05:59:43,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2646/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 6.831318e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66053 samples/s/p 0:11:16 } +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2648/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.774515e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66019 samples/s/p 0:11:14 } +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2650/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.71792e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65899 samples/s/p 0:11:11 } +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2652/ 3125], loss: 0.039, per_step_time: 1413ms, lr: 6.661624e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:51,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66069 samples/s/p 0:11:08 } +2024-07-30 05:59:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2654/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 6.605536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:54,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.65781 samples/s/p 0:11:05 } +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2656/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 6.549686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66083 samples/s/p 0:11:02 } +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2658/ 3125], loss: 0.437, per_step_time: 1415ms, lr: 6.494045e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.65305 samples/s/p 0:11:00 } +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2660/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.4386725e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66123 samples/s/p 0:10:57 } +2024-07-30 06:00:05,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2662/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 6.383538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:05,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65952 samples/s/p 0:10:54 } +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2664/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 6.328612e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65947 samples/s/p 0:10:51 } +2024-07-30 06:00:11,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2666/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.273955e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66089 samples/s/p 0:10:48 } +2024-07-30 06:00:14,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2668/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 6.2194765e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66069 samples/s/p 0:10:45 } +2024-07-30 06:00:17,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2670/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.1652656e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:17,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66053 samples/s/p 0:10:43 } +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2672/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.111294e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65991 samples/s/p 0:10:40 } +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2674/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 6.05759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66123 samples/s/p 0:10:37 } +2024-07-30 06:00:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2676/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.0041245e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:25,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66052 samples/s/p 0:10:34 } +2024-07-30 06:00:28,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2678/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 5.950838e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:28,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65746 samples/s/p 0:10:32 } +2024-07-30 06:00:31,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2680/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.89779e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:31,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66112 samples/s/p 0:10:28 } +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2682/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 5.8449803e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65811 samples/s/p 0:10:26 } +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2684/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 5.792439e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65687 samples/s/p 0:10:23 } +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2686/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7401657e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66132 samples/s/p 0:10:20 } +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2688/ 3125], loss: 0.657, per_step_time: 1413ms, lr: 5.6880115e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65976 samples/s/p 0:10:17 } +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2690/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 5.6361852e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65857 samples/s/p 0:10:14 } +2024-07-30 06:00:48,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2692/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.5845973e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:48,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65666 samples/s/p 0:10:12 } +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2694/ 3125], loss: 0.072, per_step_time: 1414ms, lr: 5.5332183e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65381 samples/s/p 0:10:09 } +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2696/ 3125], loss: 0.481, per_step_time: 1414ms, lr: 5.4820475e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65390 samples/s/p 0:10:07 } +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2698/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 5.4311453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.66035 samples/s/p 0:10:03 } +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2700/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.3805113e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66141 samples/s/p 0:10:00 } +2024-07-30 06:01:02,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2702/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.3300855e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:02,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65871 samples/s/p 0:09:58 } +2024-07-30 06:01:05,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2704/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 5.2798686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:05,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65883 samples/s/p 0:09:55 } +2024-07-30 06:01:08,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2706/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.22992e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65968 samples/s/p 0:09:52 } +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2708/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 5.1802097e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65790 samples/s/p 0:09:49 } +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.1307378e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65897 samples/s/p 0:09:46 } +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2712/ 3125], loss: 0.024, per_step_time: 1414ms, lr: 5.081445e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:16,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65698 samples/s/p 0:09:44 } +2024-07-30 06:01:19,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2714/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 5.03242e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:19,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65615 samples/s/p 0:09:41 } +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2716/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 4.9836633e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65893 samples/s/p 0:09:38 } +2024-07-30 06:01:25,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2718/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 4.9351453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:25,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65535 samples/s/p 0:09:35 } +2024-07-30 06:01:28,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2720/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.886836e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:28,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65970 samples/s/p 0:09:32 } +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2722/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 4.8387644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65780 samples/s/p 0:09:29 } +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2724/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.790902e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65957 samples/s/p 0:09:26 } +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2726/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.7433375e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.66084 samples/s/p 0:09:23 } +2024-07-30 06:01:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2728/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.6959517e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65848 samples/s/p 0:09:21 } +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2730/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 4.6488342e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:42,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65949 samples/s/p 0:09:18 } +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2732/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 4.601985e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:45,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65898 samples/s/p 0:09:15 } +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2734/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 4.5553147e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66094 samples/s/p 0:09:12 } +2024-07-30 06:01:50,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2736/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.5088825e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:50,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66014 samples/s/p 0:09:09 } +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2738/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 4.462689e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66020 samples/s/p 0:09:06 } +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2740/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 4.416764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66110 samples/s/p 0:09:04 } +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2742/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.3710767e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66007 samples/s/p 0:09:01 } +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2744/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.3255984e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66006 samples/s/p 0:08:58 } +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2746/ 3125], loss: 0.068, per_step_time: 1412ms, lr: 4.2803883e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.66201 samples/s/p 0:08:55 } +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2748/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 4.2353868e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.65660 samples/s/p 0:08:53 } +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2750/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.1906535e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65931 samples/s/p 0:08:50 } +2024-07-30 06:02:13,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2752/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 4.1461288e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:13,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65288 samples/s/p 0:08:47 } +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2754/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 4.1018424e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65963 samples/s/p 0:08:44 } +2024-07-30 06:02:19,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2756/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 4.0577948e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:19,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65400 samples/s/p 0:08:42 } +2024-07-30 06:02:22,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2758/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 4.014015e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:22,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66116 samples/s/p 0:08:38 } +2024-07-30 06:02:24,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2760/ 3125], loss: 0.477, per_step_time: 1414ms, lr: 3.9704442e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65535 samples/s/p 0:08:36 } +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2762/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 3.9270518e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66001 samples/s/p 0:08:33 } +2024-07-30 06:02:30,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2764/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.8839875e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:30,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66100 samples/s/p 0:08:30 } +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2766/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 3.841102e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66172 samples/s/p 0:08:27 } +2024-07-30 06:02:36,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2768/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 3.7985146e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:36,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66055 samples/s/p 0:08:24 } +2024-07-30 06:02:39,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2770/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.7561357e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:39,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66107 samples/s/p 0:08:21 } +2024-07-30 06:02:41,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2772/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.7139653e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66095 samples/s/p 0:08:18 } +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2774/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 3.6720333e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66015 samples/s/p 0:08:16 } +2024-07-30 06:02:47,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2776/ 3125], loss: 0.407, per_step_time: 1412ms, lr: 3.63034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:47,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66217 samples/s/p 0:08:13 } +2024-07-30 06:02:50,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2778/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 3.5889446e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:50,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.65970 samples/s/p 0:08:10 } +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2780/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5476685e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66154 samples/s/p 0:08:07 } +2024-07-30 06:02:56,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2782/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 3.5067497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:56,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.65665 samples/s/p 0:08:05 } +2024-07-30 06:02:58,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2784/ 3125], loss: 0.311, per_step_time: 1416ms, lr: 3.46601e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:58,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.64915 samples/s/p 0:08:02 } +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2786/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.4255386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.66085 samples/s/p 0:07:59 } +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2788/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 3.3852753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65746 samples/s/p 0:07:56 } +2024-07-30 06:03:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2790/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 3.3452807e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:07,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65655 samples/s/p 0:07:53 } +2024-07-30 06:03:10,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2792/ 3125], loss: 0.171, per_step_time: 1414ms, lr: 3.3054945e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65675 samples/s/p 0:07:50 } +2024-07-30 06:03:13,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2794/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.265947e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:13,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65953 samples/s/p 0:07:47 } +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2796/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 3.226608e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65579 samples/s/p 0:07:45 } +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2798/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 3.187567e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65651 samples/s/p 0:07:42 } +2024-07-30 06:03:21,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2800/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 3.1487644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65849 samples/s/p 0:07:39 } +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2802/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 3.1101703e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65628 samples/s/p 0:07:36 } +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2804/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 3.071755e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66168 samples/s/p 0:07:33 } +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2806/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 3.033668e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65938 samples/s/p 0:07:30 } +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2808/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 2.995759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:32,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65661 samples/s/p 0:07:28 } +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2810/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 2.9581486e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66193 samples/s/p 0:07:25 } +2024-07-30 06:03:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2812/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 2.920717e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:38,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66080 samples/s/p 0:07:22 } +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2814/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 2.8835236e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66117 samples/s/p 0:07:19 } +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2816/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 2.8466582e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66206 samples/s/p 0:07:16 } +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2818/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 2.8099416e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66092 samples/s/p 0:07:13 } +2024-07-30 06:03:49,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2820/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 2.773434e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:49,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66157 samples/s/p 0:07:10 } +2024-07-30 06:03:52,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2822/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.7372538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:52,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65920 samples/s/p 0:07:08 } +2024-07-30 06:03:55,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2824/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.7012526e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:55,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65898 samples/s/p 0:07:05 } +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2826/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 2.6655197e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65901 samples/s/p 0:07:02 } +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2828/ 3125], loss: 0.230, per_step_time: 1415ms, lr: 2.6299952e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65340 samples/s/p 0:07:00 } +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2830/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.5947392e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66121 samples/s/p 0:06:56 } +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2832/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.5597213e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:06,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65986 samples/s/p 0:06:54 } +2024-07-30 06:04:09,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2834/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.5248527e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:09,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66093 samples/s/p 0:06:51 } +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2836/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.4903715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65807 samples/s/p 0:06:48 } +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2838/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.4560093e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:15,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65890 samples/s/p 0:06:45 } +2024-07-30 06:04:18,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2840/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 2.4219453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:18,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65668 samples/s/p 0:06:43 } +2024-07-30 06:04:21,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2842/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 2.3881196e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65916 samples/s/p 0:06:40 } +2024-07-30 06:04:23,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2844/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 2.3544729e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:23,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66031 samples/s/p 0:06:37 } +2024-07-30 06:04:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2846/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3211241e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65838 samples/s/p 0:06:34 } +2024-07-30 06:04:29,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2848/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 2.2880137e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:29,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65738 samples/s/p 0:06:31 } +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2850/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.255082e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65957 samples/s/p 0:06:28 } +2024-07-30 06:04:35,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2852/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2224187e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65793 samples/s/p 0:06:26 } +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2854/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.1899938e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65466 samples/s/p 0:06:23 } +2024-07-30 06:04:40,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2856/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.1578073e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:40,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65789 samples/s/p 0:06:20 } +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2858/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 2.125889e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65762 samples/s/p 0:06:17 } +2024-07-30 06:04:46,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2860/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 2.0941794e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:46,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65700 samples/s/p 0:06:14 } +2024-07-30 06:04:49,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2862/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 2.0627379e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:49,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65876 samples/s/p 0:06:11 } +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2864/ 3125], loss: 0.192, per_step_time: 1419ms, lr: 2.0314753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.63396 samples/s/p 0:06:10 } +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2866/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.0005107e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65774 samples/s/p 0:06:06 } +2024-07-30 06:04:57,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2868/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.9697248e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65774 samples/s/p 0:06:03 } +2024-07-30 06:05:00,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2870/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 1.9392072e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:00,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65980 samples/s/p 0:06:00 } +2024-07-30 06:05:03,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2872/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 1.908958e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:03,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65935 samples/s/p 0:05:57 } +2024-07-30 06:05:06,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2874/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.8788874e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:06,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66035 samples/s/p 0:05:54 } +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2876/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 1.849085e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:09,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65987 samples/s/p 0:05:51 } +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2878/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 1.819521e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.65837 samples/s/p 0:05:49 } +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2880/ 3125], loss: 0.092, per_step_time: 1412ms, lr: 1.7902254e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66174 samples/s/p 0:05:46 } +2024-07-30 06:05:17,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2882/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 1.7611086e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:17,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.65958 samples/s/p 0:05:43 } +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2884/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.73226e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66028 samples/s/p 0:05:40 } +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2886/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.7036497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:23,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66043 samples/s/p 0:05:37 } +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2888/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.6752184e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65676 samples/s/p 0:05:35 } +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2890/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.6471148e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:29,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66021 samples/s/p 0:05:32 } +2024-07-30 06:05:31,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2892/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 1.6192198e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:31,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65746 samples/s/p 0:05:29 } +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2894/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.5915631e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65990 samples/s/p 0:05:26 } +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2896/ 3125], loss: 0.167, per_step_time: 1415ms, lr: 1.5641152e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65325 samples/s/p 0:05:24 } +2024-07-30 06:05:40,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2898/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.5369654e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:40,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66089 samples/s/p 0:05:20 } +2024-07-30 06:05:43,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2900/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 1.5099644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:43,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65903 samples/s/p 0:05:18 } +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2902/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4832615e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65976 samples/s/p 0:05:15 } +2024-07-30 06:05:48,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2904/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 1.4568269e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:48,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65905 samples/s/p 0:05:12 } +2024-07-30 06:05:51,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2906/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 1.4305412e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:51,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65696 samples/s/p 0:05:09 } +2024-07-30 06:05:54,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2908/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.4045536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65658 samples/s/p 0:05:06 } +2024-07-30 06:05:57,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2910/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 1.3787746e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:57,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65774 samples/s/p 0:05:04 } +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2912/ 3125], loss: 0.152, per_step_time: 1424ms, lr: 1.35329365e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.61424 samples/s/p 0:05:03 } +2024-07-30 06:06:03,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2914/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.3279915e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:03,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.66012 samples/s/p 0:04:58 } +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2916/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.3029575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.66034 samples/s/p 0:04:55 } +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2918/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 1.2781322e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:08,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65049 samples/s/p 0:04:53 } +2024-07-30 06:06:11,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2920/ 3125], loss: 0.135, per_step_time: 1417ms, lr: 1.253575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:11,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.64366 samples/s/p 0:04:50 } +2024-07-30 06:06:14,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2922/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 1.2292862e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.66102 samples/s/p 0:04:46 } +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2924/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.20517605e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65871 samples/s/p 0:04:44 } +2024-07-30 06:06:20,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2926/ 3125], loss: 0.231, per_step_time: 1415ms, lr: 1.1813044e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:20,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65217 samples/s/p 0:04:41 } +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2928/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.1576712e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65737 samples/s/p 0:04:38 } +2024-07-30 06:06:25,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2930/ 3125], loss: 0.466, per_step_time: 1413ms, lr: 1.1342763e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:25,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66048 samples/s/p 0:04:35 } +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2932/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.1111796e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66025 samples/s/p 0:04:32 } +2024-07-30 06:06:31,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2934/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.0882616e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:31,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65663 samples/s/p 0:04:30 } +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2936/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.0656118e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65991 samples/s/p 0:04:27 } +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2938/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.0431707e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65906 samples/s/p 0:04:24 } +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2940/ 3125], loss: 0.265, per_step_time: 1412ms, lr: 1.0209978e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.66172 samples/s/p 0:04:21 } +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2942/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 9.990334e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65513 samples/s/p 0:04:18 } +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2944/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 9.773076e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65858 samples/s/p 0:04:15 } +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2946/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.558499e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65774 samples/s/p 0:04:13 } +2024-07-30 06:06:51,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2948/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.346604e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65572 samples/s/p 0:04:10 } +2024-07-30 06:06:54,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2950/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 9.136498e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:54,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.66183 samples/s/p 0:04:07 } +2024-07-30 06:06:57,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2952/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 8.9284775e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65843 samples/s/p 0:04:04 } +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2954/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 8.723438e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65623 samples/s/p 0:04:01 } +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2956/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.520781e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65970 samples/s/p 0:03:58 } +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2958/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 8.320212e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65521 samples/s/p 0:03:56 } +2024-07-30 06:07:08,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2960/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 8.122623e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65411 samples/s/p 0:03:53 } +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2962/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.926523e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66084 samples/s/p 0:03:50 } +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2964/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 7.733404e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66168 samples/s/p 0:03:47 } +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2966/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 7.542371e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66093 samples/s/p 0:03:44 } +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2968/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 7.354021e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65908 samples/s/p 0:03:41 } +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2970/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 7.167458e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:22,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65623 samples/s/p 0:03:39 } +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2972/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 6.983876e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65937 samples/s/p 0:03:36 } +2024-07-30 06:07:28,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2974/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.802976e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:28,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65823 samples/s/p 0:03:33 } +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2976/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 6.623864e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65972 samples/s/p 0:03:30 } +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2978/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 6.447136e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65974 samples/s/p 0:03:27 } +2024-07-30 06:07:36,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2980/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.2727925e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:36,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66001 samples/s/p 0:03:24 } +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2982/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 6.101131e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65959 samples/s/p 0:03:22 } +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2984/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 5.931854e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66031 samples/s/p 0:03:19 } +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2986/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.764663e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:45,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65839 samples/s/p 0:03:16 } +2024-07-30 06:07:48,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2988/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 5.600452e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:48,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66146 samples/s/p 0:03:13 } +2024-07-30 06:07:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2990/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 5.4374336e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65732 samples/s/p 0:03:10 } +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2992/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 5.277693e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65940 samples/s/p 0:03:08 } +2024-07-30 06:07:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2994/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 5.120039e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65783 samples/s/p 0:03:05 } +2024-07-30 06:07:59,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2996/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.965365e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:59,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.66045 samples/s/p 0:03:02 } +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2998/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 4.812181e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:02,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65741 samples/s/p 0:02:59 } +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3000/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 4.6625734e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65838 samples/s/p 0:02:56 } +2024-07-30 06:08:07,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3002/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 4.5138595e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:07,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65745 samples/s/p 0:02:53 } +2024-07-30 06:08:10,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3004/ 3125], loss: 0.333, per_step_time: 1415ms, lr: 4.3684243e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:10,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65365 samples/s/p 0:02:51 } +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3006/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 4.225373e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65827 samples/s/p 0:02:48 } +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3008/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 4.0844084e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65729 samples/s/p 0:02:45 } +2024-07-30 06:08:19,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3010/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 3.946125e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:19,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65991 samples/s/p 0:02:42 } +2024-07-30 06:08:22,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3012/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.809929e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:22,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66133 samples/s/p 0:02:39 } +2024-07-30 06:08:24,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3014/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.6761163e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:24,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65918 samples/s/p 0:02:36 } +2024-07-30 06:08:27,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3016/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.544986e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:27,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66126 samples/s/p 0:02:34 } +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3018/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4165382e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65931 samples/s/p 0:02:31 } +2024-07-30 06:08:33,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3020/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2895802e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66070 samples/s/p 0:02:28 } +2024-07-30 06:08:36,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3022/ 3125], loss: 0.099, per_step_time: 1414ms, lr: 3.1656027e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:36,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65436 samples/s/p 0:02:25 } +2024-07-30 06:08:39,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3024/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 3.043711e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65989 samples/s/p 0:02:22 } +2024-07-30 06:08:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3026/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 2.9245018e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:41,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66078 samples/s/p 0:02:19 } +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3028/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 2.8073788e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65435 samples/s/p 0:02:17 } +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3030/ 3125], loss: 0.028, per_step_time: 1413ms, lr: 2.6926397e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65915 samples/s/p 0:02:14 } +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3032/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 2.580881e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:50,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65859 samples/s/p 0:02:11 } +2024-07-30 06:08:53,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3034/ 3125], loss: 0.190, per_step_time: 1416ms, lr: 2.4709106e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:53,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.64690 samples/s/p 0:02:08 } +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3036/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 2.3639202e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65916 samples/s/p 0:02:05 } +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3038/ 3125], loss: 0.532, per_step_time: 1415ms, lr: 2.2587179e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65295 samples/s/p 0:02:03 } +2024-07-30 06:09:01,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3040/ 3125], loss: 0.358, per_step_time: 1412ms, lr: 2.155602e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:01,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.66244 samples/s/p 0:02:00 } +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3042/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 2.0557642e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65904 samples/s/p 0:01:57 } +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3044/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.9577144e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65661 samples/s/p 0:01:54 } +2024-07-30 06:09:10,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3046/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.8620491e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:10,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65813 samples/s/p 0:01:51 } +2024-07-30 06:09:13,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3048/ 3125], loss: 0.417, per_step_time: 1417ms, lr: 1.7693639e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:13,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.64519 samples/s/p 0:01:49 } +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3050/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6784667e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65850 samples/s/p 0:01:46 } +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3052/ 3125], loss: 0.300, per_step_time: 1415ms, lr: 1.5902519e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65246 samples/s/p 0:01:43 } +2024-07-30 06:09:21,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3054/ 3125], loss: 0.165, per_step_time: 1414ms, lr: 1.5044211e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:21,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65690 samples/s/p 0:01:40 } +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3056/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 1.4206767e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66235 samples/s/p 0:01:37 } +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3058/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.3396143e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65823 samples/s/p 0:01:34 } +2024-07-30 06:09:30,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3060/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 1.2612342e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66244 samples/s/p 0:01:31 } +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3062/ 3125], loss: 0.255, per_step_time: 1415ms, lr: 1.1846423e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:32,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65355 samples/s/p 0:01:29 } +2024-07-30 06:09:35,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3064/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 1.1107325e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:35,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66136 samples/s/p 0:01:26 } +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3066/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 1.038909e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:38,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66112 samples/s/p 0:01:23 } +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3068/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.694695e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65954 samples/s/p 0:01:20 } +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3070/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.0271235e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:44,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66032 samples/s/p 0:01:17 } +2024-07-30 06:09:47,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3072/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.380413e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:47,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65923 samples/s/p 0:01:14 } +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3074/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 7.7605244e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66026 samples/s/p 0:01:12 } +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3076/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.161498e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66132 samples/s/p 0:01:09 } +2024-07-30 06:09:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3078/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 6.595254e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65903 samples/s/p 0:01:06 } +2024-07-30 06:09:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3080/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 6.043911e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65513 samples/s/p 0:01:03 } +2024-07-30 06:10:01,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3082/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 5.5164096e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:01,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65625 samples/s/p 0:01:00 } +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3084/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 5.0157306e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65705 samples/s/p 0:00:57 } +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3086/ 3125], loss: 0.515, per_step_time: 1415ms, lr: 4.5418738e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:06,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65354 samples/s/p 0:00:55 } +2024-07-30 06:10:09,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3088/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 4.0858983e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65823 samples/s/p 0:00:52 } +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3090/ 3125], loss: 0.113, per_step_time: 1414ms, lr: 3.6537645e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65669 samples/s/p 0:00:49 } +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3092/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 3.2514333e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65391 samples/s/p 0:00:46 } +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3094/ 3125], loss: 0.468, per_step_time: 1413ms, lr: 2.8669833e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66018 samples/s/p 0:00:43 } +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3096/ 3125], loss: 0.111, per_step_time: 1412ms, lr: 2.5063754e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66212 samples/s/p 0:00:40 } +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3098/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.1785497e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65821 samples/s/p 0:00:38 } +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3100/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.8656253e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65938 samples/s/p 0:00:35 } +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3102/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.5825033e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.65895 samples/s/p 0:00:32 } +2024-07-30 06:10:32,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3104/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.3172625e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66116 samples/s/p 0:00:29 } +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3106/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 1.0818243e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66204 samples/s/p 0:00:26 } +2024-07-30 06:10:38,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3108/ 3125], loss: 0.070, per_step_time: 1413ms, lr: 8.612871e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66018 samples/s/p 0:00:24 } +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3110/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 6.705522e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.65998 samples/s/p 0:00:21 } +2024-07-30 06:10:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3112/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 5.0663945e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65954 samples/s/p 0:00:18 } +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3114/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 3.606081e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:46,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65513 samples/s/p 0:00:15 } +2024-07-30 06:10:49,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3116/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 2.3841857e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:49,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65458 samples/s/p 0:00:12 } +2024-07-30 06:10:52,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3118/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.4603138e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:52,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65863 samples/s/p 0:00:09 } +2024-07-30 06:10:55,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3120/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.45058e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:55,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65818 samples/s/p 0:00:07 } +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3122/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 2.682209e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65681 samples/s/p 0:00:04 } +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3124/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 2.9802322e-13, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65942 samples/s/p 0:00:01 } +2024-07-30 06:11:00,848 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 06:11:34,128 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_3.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_3.log" new file mode 100644 index 00000000..76bd4735 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/finetune_msrun_log/worker_3.log" @@ -0,0 +1,10018 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:07:41.164.963 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:07:42.165.197 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 2 +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:07:43.166.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:07:46.166.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:07:46.166.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 3 rank id: 3 +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:08:11.273.534 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DEVICE(979001,ffff9d477010,python):2024-07-30-02:08:11.274.137 [mindspore/ccsrc/plugin/device/cpu/hal/hardware/ms_collective_comm_lib.cc:200] QueryUniqueID] Retry to lookup the unique id for group hccl_world_group from the meta server node...Retry time: 199/200 +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:08:14.274.575 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(979001,ffff9d477010,python):2024-07-30-02:08:14.504.137 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-30 02:08:14,507 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_3.ckpt' +2024-07-30 02:08:14,541 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-30 02:08:14,541 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-30 02:08:14,542 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-30 02:08:14,542 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-30 02:08:14,543 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/research/output' +2024-07-30 02:08:14,543 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-30 02:08:14,544 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. +2024-07-30 02:08:14,544 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-30 02:08:14,544 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-30 02:08:14,544 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,545 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-30 02:08:14,545 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-30 02:08:14,545 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-30 02:08:14,545 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 02:08:14,546 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-30 02:08:14,546 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-30 02:08:14,546 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-30 02:08:14,546 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-30 02:08:14,553 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:3125 +2024-07-30 02:08:14,553 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:3, sink_size:2 +2024-07-30 02:08:14,553 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:3125 +2024-07-30 02:08:14,554 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-30 02:08:14,554 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-30 02:08:14,555 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-30 02:08:14,556 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. +2024-07-30 02:08:14,556 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:08:14.558.155 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:08:14.560.878 [/home/ma-user/work/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-30 02:08:14,665 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:08:14.667.080 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:08:14.667.222 [mindspore/common/parameter.py:806] This interface may be deleted in the future. +2024-07-30 02:08:14,687 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,708 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,729 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,750 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,771 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,792 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,813 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,834 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:14,856 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 02:08:15,337 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,542 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 02:08:15,564 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-30 02:08:15,565 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... +2024-07-30 02:08:15,565 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-30 02:08:15,565 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-30 02:08:15,571 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-30 02:08:15,575 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + "model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + "model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + "model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-30 02:08:15,676 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... +2024-07-30 02:08:15,676 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-30 02:08:15,683 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-30 02:08:15,684 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-30 02:08:15,685 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-30 02:08:15,686 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:09:57.119.262 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.161.362 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.162.059 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.162.494 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.306.051 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.353.352 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.395.463 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:02.539.922 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:03.128.753 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:03.726.496 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.313.265 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.314.055 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.314.494 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.465.606 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.506.378 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.545.753 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:04.691.452 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:05.273.029 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:05.851.479 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.427.360 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.428.193 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.428.664 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.586.842 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.631.625 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.674.382 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:06.818.887 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:07.399.870 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:07.969.689 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.638.935 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.639.760 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.640.205 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.796.896 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.839.856 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:08.880.910 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:09.431.87 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:09.613.503 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.188.658 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.761.438 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.762.274 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.762.705 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.940.481 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:10.982.869 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:11.238.65 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:11.190.215 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:11.764.704 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:12.455.699 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.307.83 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.315.94 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.320.40 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.191.096 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.238.962 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.280.381 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:13.455.967 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:14.495.26 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:14.624.602 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.261.261 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.262.077 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.262.505 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.455.173 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.511.780 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.552.165 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:15.717.358 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:16.280.978 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:16.849.363 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.435.057 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.435.863 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.436.316 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.600.273 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.653.821 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.701.575 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:17.867.549 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:18.433.390 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.166.93 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.583.460 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.584.266 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.584.743 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.750.966 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.800.666 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:19.848.676 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:20.128.17 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:20.576.822 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.164.918 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.742.805 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.743.639 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.744.098 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.933.293 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:21.981.211 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:22.309.24 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:22.235.298 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:22.844.776 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:23.459.802 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.402.32 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.411.39 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.415.85 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.297.622 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.348.287 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.414.602 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:24.592.890 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:25.176.437 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:25.780.131 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.389.699 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.390.587 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.391.041 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.563.586 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.621.190 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.685.183 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:26.861.282 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:27.433.141 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.821.3 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.590.658 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.591.474 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.591.913 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.781.319 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.827.786 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:28.877.210 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:29.508.95 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:29.613.572 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:30.174.442 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:30.755.187 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:30.756.008 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:30.756.440 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:30.977.053 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:31.270.84 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:31.921.81 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:31.276.936 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:31.878.804 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:32.493.118 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.578.68 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.587.54 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.592.00 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.243.819 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.298.962 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.371.837 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:33.547.755 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:34.119.316 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:34.697.531 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.295.575 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.296.448 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.296.923 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.474.429 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.522.730 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.571.721 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:35.747.694 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:36.322.920 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:36.900.389 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.504.455 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.505.320 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.505.761 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.681.377 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.728.861 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.779.048 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:37.963.568 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:38.570.171 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:39.190.558 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:39.777.625 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:39.778.424 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:39.778.860 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:40.117.80 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:40.728.85 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:40.140.371 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:40.319.531 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:40.894.168 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:41.474.451 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.681.62 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.689.81 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.694.28 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.245.394 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.296.996 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.365.169 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:42.542.646 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:43.116.096 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:43.688.292 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.302.422 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.303.283 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.303.716 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.477.069 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.525.464 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.574.556 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:44.749.685 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:45.311.990 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:45.938.869 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.552.333 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.553.250 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.553.688 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.768.036 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.818.102 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:46.869.664 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:47.472.30 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:47.654.751 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:48.237.399 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:48.893.749 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:48.894.528 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:48.894.953 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:49.120.815 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:49.169.260 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:49.216.611 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:49.400.502 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:49.988.021 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:50.570.370 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.149.549 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.150.394 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.150.846 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.326.089 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.381.289 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.430.101 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:51.606.462 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:52.201.940 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:52.801.840 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.402.098 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.402.957 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.403.401 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.583.978 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.631.518 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.680.424 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:53.857.173 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:54.461.303 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.486.52 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.649.087 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.649.971 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.650.421 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.892.262 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:55.954.185 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:56.100.1 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:56.175.056 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:56.791.299 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:57.353.835 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:57.951.563 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:57.952.480 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:57.952.985 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:58.160.320 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:58.215.653 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:58.289.902 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:58.473.073 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:59.690.09 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:10:59.672.971 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.262.422 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.263.383 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.263.838 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.441.391 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.492.557 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.545.696 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:00.722.060 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:01.325.741 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:01.916.355 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.513.088 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.513.919 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.514.370 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.692.947 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.741.555 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.789.966 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:02.971.760 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:03.563.466 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:04.163.028 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:04.734.127 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:04.734.959 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:04.735.399 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:04.978.046 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:05.292.35 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:05.808.37 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:05.265.630 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:05.838.904 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:06.407.608 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.325.95 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.334.05 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.338.44 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.211.527 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.261.012 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.314.621 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:07.496.464 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:08.101.233 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:08.713.265 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.292.348 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.293.149 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.293.580 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.517.935 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.569.623 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.678.830 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:09.872.757 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:10.478.150 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:11.833.85 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:11.670.766 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:11.671.639 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:11.672.084 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:11.861.753 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:12.336.26 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:12.149.805 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:12.327.379 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:12.915.672 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:13.500.625 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:14.109.732 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:14.110.561 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:39.700.36 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:39.744.43 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:46.122.302 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:46.126.094 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:53.150.818 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:11:53.154.627 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:00.172.602 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:00.176.355 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:07.147.121 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:07.151.027 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:14.982.09 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:14.102.173 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:21.887.45 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:21.926.08 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:28.527.05 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:28.564.94 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:35.336.64 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:35.375.69 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:41.966.944 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:41.970.882 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:48.987.700 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:48.991.649 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:55.945.189 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:12:55.948.992 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:02.879.806 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:02.883.799 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:09.840.365 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:09.881.197 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:16.786.259 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:16.790.208 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:23.743.572 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:23.747.397 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:30.694.247 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:30.698.416 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:37.714.018 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:37.717.888 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:44.666.985 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:44.670.967 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:51.606.206 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:51.610.083 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:58.571.781 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:13:58.575.861 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:05.594.478 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:05.598.318 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:12.571.150 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:12.575.059 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:19.580.866 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:19.584.715 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:26.528.325 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:26.532.414 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:33.571.352 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:33.575.199 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:40.576.614 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:40.580.593 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:47.570.481 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:47.574.308 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:54.642.886 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:14:54.647.041 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:01.750.488 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:01.754.330 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:08.807.518 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:08.811.453 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:15.925.427 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:15.929.425 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:23.483.82 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:40.522.007 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:40.522.471 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-30 02:15:40,522 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-30 02:15:40,524 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO - .........Starting Training Model.......... +2024-07-30 02:15:40,524 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:40.525.447 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_begin', 'epoch_end', 'step_begin', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(979001:281473320448016,MainProcess):2024-07-30-02:15:40.525.588 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'step_end', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.619.503 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.620.239 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.620.919 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.621.585 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.622.234 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.622.922 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.623.561 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.624.217 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.624.891 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.625.541 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.626.184 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.626.824 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.627.467 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.628.120 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.628.783 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.629.424 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.630.076 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.630.731 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.631.373 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.632.020 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.632.696 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.633.354 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.633.995 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.634.648 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.635.287 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.635.916 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.636.563 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.637.210 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.637.851 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.638.510 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.639.139 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.639.766 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.640.213 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.640.935 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.641.666 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.642.396 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.643.112 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.643.849 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.644.595 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.645.322 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.646.049 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.646.761 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.647.477 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.648.204 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.648.936 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.649.654 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.650.343 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.651.053 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.651.743 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.652.452 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.653.166 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.653.846 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.654.528 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.655.231 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.655.924 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.656.608 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.657.294 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.657.968 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.658.647 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.659.328 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.660.009 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.660.731 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.661.406 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:08.662.039 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(979001,ffff9d477010,python):2024-07-30-02:16:11.179.384 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. +- \ | / - 2024-07-30 02:26:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2/ 3125], loss: 1.392, per_step_time: 318393ms, lr: 3.558719e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:19,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02513 samples/s/p 34 days, 12:58:23 } +2024-07-30 02:26:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 4/ 3125], loss: 1.327, per_step_time: 1428ms, lr: 1.0676156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.59991 samples/s/p 3:43:07 } +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 6/ 3125], loss: 1.193, per_step_time: 1413ms, lr: 1.7793593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:26,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.66099 samples/s/p 3:40:40 } +2024-07-30 02:26:28,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 8/ 3125], loss: 1.399, per_step_time: 1416ms, lr: 2.4911031e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:28,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.64597 samples/s/p 3:41:12 } +2024-07-30 02:26:31,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 10/ 3125], loss: 1.360, per_step_time: 1414ms, lr: 3.202847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:31,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65556 samples/s/p 3:40:47 } +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 12/ 3125], loss: 1.379, per_step_time: 1413ms, lr: 3.9145905e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:34,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65841 samples/s/p 3:40:37 } +2024-07-30 02:26:37,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 14/ 3125], loss: 1.350, per_step_time: 1413ms, lr: 4.6263344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.65920 samples/s/p 3:40:32 } +2024-07-30 02:26:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 16/ 3125], loss: 1.343, per_step_time: 1413ms, lr: 5.3380785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:40,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.66085 samples/s/p 3:40:26 } +2024-07-30 02:26:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 18/ 3125], loss: 1.049, per_step_time: 1413ms, lr: 6.049822e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:43,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65788 samples/s/p 3:40:30 } +2024-07-30 02:26:45,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 20/ 3125], loss: 1.286, per_step_time: 1413ms, lr: 6.7615656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65901 samples/s/p 3:40:24 } +2024-07-30 02:26:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 22/ 3125], loss: 1.170, per_step_time: 1413ms, lr: 7.473309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.65811 samples/s/p 3:40:24 } +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 24/ 3125], loss: 1.197, per_step_time: 1413ms, lr: 8.185053e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:51,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66051 samples/s/p 3:40:15 } +2024-07-30 02:26:54,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 26/ 3125], loss: 1.367, per_step_time: 1413ms, lr: 8.896797e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:54,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65806 samples/s/p 3:40:18 } +2024-07-30 02:26:57,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 28/ 3125], loss: 1.430, per_step_time: 1413ms, lr: 9.608541e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:26:57,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65815 samples/s/p 3:40:15 } +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 30/ 3125], loss: 1.447, per_step_time: 1412ms, lr: 1.0320284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:00,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.66195 samples/s/p 3:40:03 } +2024-07-30 02:27:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 32/ 3125], loss: 1.653, per_step_time: 1415ms, lr: 1.1032029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:02,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.65306 samples/s/p 3:40:21 } +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 34/ 3125], loss: 1.188, per_step_time: 1424ms, lr: 1.1743772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:05,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.61450 samples/s/p 3:41:49 } +2024-07-30 02:27:08,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 36/ 3125], loss: 1.306, per_step_time: 1414ms, lr: 1.2455515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:08,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65688 samples/s/p 3:40:07 } +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 38/ 3125], loss: 1.332, per_step_time: 1413ms, lr: 1.3167258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.66015 samples/s/p 3:39:56 } +2024-07-30 02:27:14,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 40/ 3125], loss: 1.375, per_step_time: 1416ms, lr: 1.3879004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:14,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.64958 samples/s/p 3:40:18 } +2024-07-30 02:27:17,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 42/ 3125], loss: 1.420, per_step_time: 1413ms, lr: 1.4590747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:17,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.65837 samples/s/p 3:39:55 } +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 44/ 3125], loss: 1.437, per_step_time: 1412ms, lr: 1.530249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:19,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66254 samples/s/p 3:39:42 } +2024-07-30 02:27:22,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 46/ 3125], loss: 1.287, per_step_time: 1413ms, lr: 1.6014234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:22,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.66150 samples/s/p 3:39:42 } +2024-07-30 02:27:25,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 48/ 3125], loss: 1.380, per_step_time: 1414ms, lr: 1.6725978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:25,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65759 samples/s/p 3:39:48 } +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 50/ 3125], loss: 1.100, per_step_time: 1413ms, lr: 1.7437721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:28,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.65805 samples/s/p 3:39:44 } +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 52/ 3125], loss: 1.361, per_step_time: 1413ms, lr: 1.8149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:31,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66000 samples/s/p 3:39:37 } +2024-07-30 02:27:34,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 54/ 3125], loss: 1.508, per_step_time: 1413ms, lr: 1.886121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:34,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65842 samples/s/p 3:39:38 } +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 56/ 3125], loss: 1.341, per_step_time: 1413ms, lr: 1.9572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:36,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66046 samples/s/p 3:39:30 } +2024-07-30 02:27:39,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 58/ 3125], loss: 1.275, per_step_time: 1413ms, lr: 2.0284697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:39,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.66112 samples/s/p 3:39:26 } +2024-07-30 02:27:42,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 60/ 3125], loss: 1.126, per_step_time: 1414ms, lr: 2.099644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:42,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.65669 samples/s/p 3:39:33 } +2024-07-30 02:27:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 62/ 3125], loss: 1.619, per_step_time: 1413ms, lr: 2.1708183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:45,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65832 samples/s/p 3:39:27 } +2024-07-30 02:27:48,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 64/ 3125], loss: 1.251, per_step_time: 1415ms, lr: 2.2419927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:48,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65156 samples/s/p 3:39:40 } +2024-07-30 02:27:51,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 66/ 3125], loss: 1.324, per_step_time: 1413ms, lr: 2.3131672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:51,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65966 samples/s/p 3:39:18 } +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 68/ 3125], loss: 1.160, per_step_time: 1413ms, lr: 2.3843415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:53,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65822 samples/s/p 3:39:18 } +2024-07-30 02:27:56,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 70/ 3125], loss: 1.056, per_step_time: 1413ms, lr: 2.4555159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:56,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.65806 samples/s/p 3:39:16 } +2024-07-30 02:27:59,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 72/ 3125], loss: 1.486, per_step_time: 1415ms, lr: 2.5266902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:27:59,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65350 samples/s/p 3:39:24 } +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 74/ 3125], loss: 1.359, per_step_time: 1414ms, lr: 2.5978647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:02,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65639 samples/s/p 3:39:14 } +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 76/ 3125], loss: 1.356, per_step_time: 1415ms, lr: 2.669039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:05,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65172 samples/s/p 3:39:22 } +2024-07-30 02:28:08,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 78/ 3125], loss: 1.349, per_step_time: 1414ms, lr: 2.7402134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:08,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.65672 samples/s/p 3:39:08 } +2024-07-30 02:28:10,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 80/ 3125], loss: 1.630, per_step_time: 1412ms, lr: 2.8113877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:10,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66208 samples/s/p 3:38:52 } +2024-07-30 02:28:13,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 82/ 3125], loss: 1.549, per_step_time: 1414ms, lr: 2.8825623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.65723 samples/s/p 3:39:01 } +2024-07-30 02:28:16,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 84/ 3125], loss: 1.097, per_step_time: 1413ms, lr: 2.9537364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:16,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66052 samples/s/p 3:38:50 } +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 86/ 3125], loss: 1.357, per_step_time: 1412ms, lr: 3.024911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:19,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.66174 samples/s/p 3:38:45 } +2024-07-30 02:28:22,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 88/ 3125], loss: 1.011, per_step_time: 1416ms, lr: 3.0960855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:22,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.64734 samples/s/p 3:39:15 } +2024-07-30 02:28:25,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 90/ 3125], loss: 0.990, per_step_time: 1413ms, lr: 3.1672596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:25,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.66094 samples/s/p 3:38:41 } +2024-07-30 02:28:27,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 92/ 3125], loss: 1.119, per_step_time: 1414ms, lr: 3.2384341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:27,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65634 samples/s/p 3:38:49 } +2024-07-30 02:28:30,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 94/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.3096082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:30,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65793 samples/s/p 3:38:42 } +2024-07-30 02:28:33,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 96/ 3125], loss: 1.270, per_step_time: 1413ms, lr: 3.3807828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:33,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65952 samples/s/p 3:38:36 } +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 98/ 3125], loss: 1.162, per_step_time: 1415ms, lr: 3.4519574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:36,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.65359 samples/s/p 3:38:47 } +2024-07-30 02:28:39,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 100/ 3125], loss: 0.916, per_step_time: 1412ms, lr: 3.5231315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:39,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.66198 samples/s/p 3:38:24 } +2024-07-30 02:28:42,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 102/ 3125], loss: 1.030, per_step_time: 1414ms, lr: 3.594306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:42,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65557 samples/s/p 3:38:36 } +2024-07-30 02:28:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 104/ 3125], loss: 1.432, per_step_time: 1415ms, lr: 3.6654803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:44,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65342 samples/s/p 3:38:39 } +2024-07-30 02:28:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 106/ 3125], loss: 1.152, per_step_time: 1413ms, lr: 3.7366547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.65954 samples/s/p 3:38:22 } +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 108/ 3125], loss: 1.291, per_step_time: 1413ms, lr: 3.807829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:50,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65864 samples/s/p 3:38:21 } +2024-07-30 02:28:53,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 110/ 3125], loss: 1.239, per_step_time: 1413ms, lr: 3.8790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:53,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66048 samples/s/p 3:38:14 } +2024-07-30 02:28:56,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 112/ 3125], loss: 1.071, per_step_time: 1415ms, lr: 3.950178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65347 samples/s/p 3:38:27 } +2024-07-30 02:28:59,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 114/ 3125], loss: 1.148, per_step_time: 1414ms, lr: 4.021352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:28:59,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.65715 samples/s/p 3:38:16 } +2024-07-30 02:29:02,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 116/ 3125], loss: 1.301, per_step_time: 1412ms, lr: 4.0925265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:02,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.66179 samples/s/p 3:38:02 } +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 118/ 3125], loss: 0.982, per_step_time: 1413ms, lr: 4.163701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65797 samples/s/p 3:38:08 } +2024-07-30 02:29:07,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 120/ 3125], loss: 1.209, per_step_time: 1414ms, lr: 4.234875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:07,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65686 samples/s/p 3:38:08 } +2024-07-30 02:29:10,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 122/ 3125], loss: 0.910, per_step_time: 1414ms, lr: 4.3060495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:10,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65584 samples/s/p 3:38:08 } +2024-07-30 02:29:13,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 124/ 3125], loss: 1.276, per_step_time: 1414ms, lr: 4.377224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:13,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65506 samples/s/p 3:38:07 } +2024-07-30 02:29:16,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 126/ 3125], loss: 1.127, per_step_time: 1414ms, lr: 4.4483986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:16,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.65722 samples/s/p 3:37:59 } +2024-07-30 02:29:19,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 128/ 3125], loss: 0.940, per_step_time: 1414ms, lr: 4.519573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:19,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65770 samples/s/p 3:37:55 } +2024-07-30 02:29:21,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 130/ 3125], loss: 1.026, per_step_time: 1412ms, lr: 4.5907473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:21,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.66229 samples/s/p 3:37:41 } +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 132/ 3125], loss: 0.990, per_step_time: 1414ms, lr: 4.6619216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:24,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65621 samples/s/p 3:37:53 } +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 134/ 3125], loss: 1.413, per_step_time: 1413ms, lr: 4.733096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:27,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.65994 samples/s/p 3:37:41 } +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 136/ 3125], loss: 1.120, per_step_time: 1414ms, lr: 4.8042702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:30,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65743 samples/s/p 3:37:44 } +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 138/ 3125], loss: 0.952, per_step_time: 1415ms, lr: 4.8754446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:33,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65333 samples/s/p 3:37:51 } +2024-07-30 02:29:36,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 140/ 3125], loss: 1.111, per_step_time: 1413ms, lr: 4.9466194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:36,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65836 samples/s/p 3:37:36 } +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 142/ 3125], loss: 1.099, per_step_time: 1414ms, lr: 5.0177937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:38,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65612 samples/s/p 3:37:39 } +2024-07-30 02:29:41,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 144/ 3125], loss: 1.208, per_step_time: 1414ms, lr: 5.0889676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:41,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.65736 samples/s/p 3:37:33 } +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 146/ 3125], loss: 1.044, per_step_time: 1413ms, lr: 5.160142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:44,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66003 samples/s/p 3:37:24 } +2024-07-30 02:29:47,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 148/ 3125], loss: 1.002, per_step_time: 1413ms, lr: 5.2313167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:47,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66080 samples/s/p 3:37:19 } +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 150/ 3125], loss: 1.366, per_step_time: 1413ms, lr: 5.302491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66072 samples/s/p 3:37:17 } +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 152/ 3125], loss: 0.954, per_step_time: 1413ms, lr: 5.3736658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:53,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66098 samples/s/p 3:37:13 } +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 154/ 3125], loss: 0.976, per_step_time: 1413ms, lr: 5.4448396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:55,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.66014 samples/s/p 3:37:12 } +2024-07-30 02:29:58,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 156/ 3125], loss: 1.448, per_step_time: 1415ms, lr: 5.516014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:29:58,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65251 samples/s/p 3:37:27 } +2024-07-30 02:30:01,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 158/ 3125], loss: 1.134, per_step_time: 1413ms, lr: 5.5871883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:01,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65912 samples/s/p 3:37:09 } +2024-07-30 02:30:04,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 160/ 3125], loss: 1.046, per_step_time: 1413ms, lr: 5.658363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:04,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65903 samples/s/p 3:37:06 } +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 162/ 3125], loss: 1.002, per_step_time: 1414ms, lr: 5.7295374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.65467 samples/s/p 3:37:14 } +2024-07-30 02:30:10,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 164/ 3125], loss: 0.902, per_step_time: 1412ms, lr: 5.8007113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:10,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.66222 samples/s/p 3:36:53 } +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 166/ 3125], loss: 1.278, per_step_time: 1413ms, lr: 5.871886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:12,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65897 samples/s/p 3:36:58 } +2024-07-30 02:30:15,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 168/ 3125], loss: 0.935, per_step_time: 1415ms, lr: 5.9430604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:15,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65244 samples/s/p 3:37:10 } +2024-07-30 02:30:18,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 170/ 3125], loss: 0.847, per_step_time: 1413ms, lr: 6.0142347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:18,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.65900 samples/s/p 3:36:52 } +2024-07-30 02:30:21,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 172/ 3125], loss: 0.977, per_step_time: 1413ms, lr: 6.0854086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:21,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.66138 samples/s/p 3:36:44 } +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 174/ 3125], loss: 1.147, per_step_time: 1413ms, lr: 6.1565834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66034 samples/s/p 3:36:44 } +2024-07-30 02:30:27,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 176/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 6.2277577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:27,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66082 samples/s/p 3:36:40 } +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 178/ 3125], loss: 0.672, per_step_time: 1413ms, lr: 6.2989325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:29,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.65967 samples/s/p 3:36:40 } +2024-07-30 02:30:32,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 180/ 3125], loss: 0.873, per_step_time: 1413ms, lr: 6.370107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:32,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.66028 samples/s/p 3:36:35 } +2024-07-30 02:30:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 182/ 3125], loss: 1.075, per_step_time: 1416ms, lr: 6.4412807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:35,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.64734 samples/s/p 3:37:02 } +2024-07-30 02:30:38,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 184/ 3125], loss: 0.945, per_step_time: 1413ms, lr: 6.512455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:38,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65902 samples/s/p 3:36:33 } +2024-07-30 02:30:41,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 186/ 3125], loss: 0.759, per_step_time: 1415ms, lr: 6.58363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.65232 samples/s/p 3:36:45 } +2024-07-30 02:30:44,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 188/ 3125], loss: 0.980, per_step_time: 1414ms, lr: 6.654804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:44,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65680 samples/s/p 3:36:32 } +2024-07-30 02:30:46,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 190/ 3125], loss: 1.129, per_step_time: 1413ms, lr: 6.725979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:46,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.66160 samples/s/p 3:36:18 } +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 192/ 3125], loss: 0.925, per_step_time: 1413ms, lr: 6.7971528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:49,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.65894 samples/s/p 3:36:21 } +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 194/ 3125], loss: 0.785, per_step_time: 1413ms, lr: 6.868327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66028 samples/s/p 3:36:16 } +2024-07-30 02:30:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 196/ 3125], loss: 1.030, per_step_time: 1413ms, lr: 6.9395014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:55,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66026 samples/s/p 3:36:13 } +2024-07-30 02:30:58,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 198/ 3125], loss: 0.733, per_step_time: 1413ms, lr: 7.010676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:30:58,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.66017 samples/s/p 3:36:10 } +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 200/ 3125], loss: 0.688, per_step_time: 1414ms, lr: 7.0818505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:01,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.65451 samples/s/p 3:36:20 } +2024-07-30 02:31:03,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 202/ 3125], loss: 0.663, per_step_time: 1413ms, lr: 7.1530244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:03,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65858 samples/s/p 3:36:08 } +2024-07-30 02:31:06,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 204/ 3125], loss: 0.988, per_step_time: 1414ms, lr: 7.224199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:06,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65435 samples/s/p 3:36:15 } +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 206/ 3125], loss: 1.034, per_step_time: 1413ms, lr: 7.2953735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:09,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65972 samples/s/p 3:36:00 } +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 208/ 3125], loss: 0.978, per_step_time: 1414ms, lr: 7.366548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:12,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.65485 samples/s/p 3:36:08 } +2024-07-30 02:31:15,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 210/ 3125], loss: 0.827, per_step_time: 1413ms, lr: 7.4377217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:15,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.66157 samples/s/p 3:35:50 } +2024-07-30 02:31:18,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 212/ 3125], loss: 0.735, per_step_time: 1413ms, lr: 7.5088965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:18,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65974 samples/s/p 3:35:51 } +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 214/ 3125], loss: 0.890, per_step_time: 1414ms, lr: 7.580071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:20,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65482 samples/s/p 3:36:00 } +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 216/ 3125], loss: 0.707, per_step_time: 1413ms, lr: 7.651245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:23,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.66155 samples/s/p 3:35:42 } +2024-07-30 02:31:26,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 218/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 7.7224195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:26,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65957 samples/s/p 3:35:43 } +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 220/ 3125], loss: 0.692, per_step_time: 1413ms, lr: 7.793594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:29,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.65963 samples/s/p 3:35:40 } +2024-07-30 02:31:32,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 222/ 3125], loss: 0.531, per_step_time: 1413ms, lr: 7.864768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:32,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65864 samples/s/p 3:35:40 } +2024-07-30 02:31:35,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 224/ 3125], loss: 0.898, per_step_time: 1415ms, lr: 7.935942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:35,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65196 samples/s/p 3:35:52 } +2024-07-30 02:31:37,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 226/ 3125], loss: 0.747, per_step_time: 1413ms, lr: 8.007118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.66100 samples/s/p 3:35:29 } +2024-07-30 02:31:40,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 228/ 3125], loss: 0.643, per_step_time: 1413ms, lr: 8.078292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:40,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.65973 samples/s/p 3:35:29 } +2024-07-30 02:31:43,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 230/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 8.149465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:43,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66011 samples/s/p 3:35:25 } +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 232/ 3125], loss: 0.616, per_step_time: 1413ms, lr: 8.220641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:46,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65887 samples/s/p 3:35:25 } +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 234/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 8.291815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:49,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65966 samples/s/p 3:35:20 } +2024-07-30 02:31:52,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 236/ 3125], loss: 0.715, per_step_time: 1412ms, lr: 8.362989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:52,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.66230 samples/s/p 3:35:12 } +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 238/ 3125], loss: 0.645, per_step_time: 1413ms, lr: 8.434164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:54,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.65891 samples/s/p 3:35:16 } +2024-07-30 02:31:57,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 240/ 3125], loss: 0.602, per_step_time: 1413ms, lr: 8.505338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:31:57,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66121 samples/s/p 3:35:08 } +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 242/ 3125], loss: 0.831, per_step_time: 1413ms, lr: 8.576512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:00,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65795 samples/s/p 3:35:13 } +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 244/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.647687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65929 samples/s/p 3:35:07 } +2024-07-30 02:32:06,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 246/ 3125], loss: 0.654, per_step_time: 1413ms, lr: 8.718861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:06,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.65894 samples/s/p 3:35:05 } +2024-07-30 02:32:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 248/ 3125], loss: 0.650, per_step_time: 1413ms, lr: 8.790035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:09,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.66006 samples/s/p 3:35:00 } +2024-07-30 02:32:11,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 250/ 3125], loss: 0.783, per_step_time: 1414ms, lr: 8.86121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65444 samples/s/p 3:35:10 } +2024-07-30 02:32:14,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 252/ 3125], loss: 0.595, per_step_time: 1414ms, lr: 8.932384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:14,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.65611 samples/s/p 3:35:03 } +2024-07-30 02:32:17,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 254/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.003558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.66006 samples/s/p 3:34:51 } +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 256/ 3125], loss: 0.632, per_step_time: 1412ms, lr: 9.074733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:20,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.66229 samples/s/p 3:34:43 } +2024-07-30 02:32:23,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 258/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 9.145907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:23,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65935 samples/s/p 3:34:47 } +2024-07-30 02:32:26,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 260/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.217081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:26,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.66098 samples/s/p 3:34:41 } +2024-07-30 02:32:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 262/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 9.288256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:28,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65985 samples/s/p 3:34:40 } +2024-07-30 02:32:31,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 264/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.359431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:31,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65983 samples/s/p 3:34:38 } +2024-07-30 02:32:34,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 266/ 3125], loss: 0.649, per_step_time: 1413ms, lr: 9.430605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:34,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.65965 samples/s/p 3:34:35 } +2024-07-30 02:32:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 268/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.501779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:37,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65627 samples/s/p 3:34:40 } +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 270/ 3125], loss: 0.578, per_step_time: 1413ms, lr: 9.572954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.65849 samples/s/p 3:34:32 } +2024-07-30 02:32:43,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 272/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.644128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:43,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66132 samples/s/p 3:34:23 } +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 274/ 3125], loss: 0.552, per_step_time: 1413ms, lr: 9.715302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:45,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66095 samples/s/p 3:34:21 } +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 276/ 3125], loss: 0.565, per_step_time: 1412ms, lr: 9.786476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:48,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.66179 samples/s/p 3:34:16 } +2024-07-30 02:32:51,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 278/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.857651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:51,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66064 samples/s/p 3:34:16 } +2024-07-30 02:32:54,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 280/ 3125], loss: 0.584, per_step_time: 1413ms, lr: 9.928825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:54,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66142 samples/s/p 3:34:11 } +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 282/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1e-05, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:32:57,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66076 samples/s/p 3:34:10 } +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 284/ 3125], loss: 0.723, per_step_time: 1413ms, lr: 9.999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:00,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.66144 samples/s/p 3:34:06 } +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 286/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 9.999995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:02,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65966 samples/s/p 3:34:07 } +2024-07-30 02:33:05,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 288/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.999989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:05,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.65847 samples/s/p 3:34:07 } +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 290/ 3125], loss: 0.653, per_step_time: 1413ms, lr: 9.999981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:08,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66113 samples/s/p 3:33:58 } +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 292/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.99997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:11,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66137 samples/s/p 3:33:55 } +2024-07-30 02:33:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 294/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.999957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:14,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.66059 samples/s/p 3:33:53 } +2024-07-30 02:33:17,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 296/ 3125], loss: 0.624, per_step_time: 1413ms, lr: 9.9999415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:17,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65923 samples/s/p 3:33:54 } +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 298/ 3125], loss: 0.522, per_step_time: 1413ms, lr: 9.999923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:19,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65868 samples/s/p 3:33:52 } +2024-07-30 02:33:22,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 300/ 3125], loss: 0.537, per_step_time: 1414ms, lr: 9.999903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:22,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65498 samples/s/p 3:33:58 } +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 302/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.999881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:25,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65824 samples/s/p 3:33:48 } +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 304/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 9.999855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:28,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.65660 samples/s/p 3:33:48 } +2024-07-30 02:33:31,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 306/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.999828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:31,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.66244 samples/s/p 3:33:32 } +2024-07-30 02:33:34,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 308/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.999798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:34,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65931 samples/s/p 3:33:37 } +2024-07-30 02:33:36,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 310/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.999765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:36,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65992 samples/s/p 3:33:32 } +2024-07-30 02:33:39,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 312/ 3125], loss: 0.609, per_step_time: 1413ms, lr: 9.9997305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:39,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65987 samples/s/p 3:33:30 } +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 314/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 9.999694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:42,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.65932 samples/s/p 3:33:28 } +2024-07-30 02:33:45,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 316/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 9.999654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:45,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65875 samples/s/p 3:33:27 } +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 318/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 9.999613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66097 samples/s/p 3:33:19 } +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 320/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.999569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:51,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.65953 samples/s/p 3:33:19 } +2024-07-30 02:33:53,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 322/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.999521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:53,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.66033 samples/s/p 3:33:15 } +2024-07-30 02:33:56,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 324/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.999473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:56,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.66083 samples/s/p 3:33:11 } +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 326/ 3125], loss: 0.508, per_step_time: 1415ms, lr: 9.999422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:33:59,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65318 samples/s/p 3:33:25 } +2024-07-30 02:34:02,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 328/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 9.999369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65798 samples/s/p 3:33:11 } +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 330/ 3125], loss: 0.249, per_step_time: 1426ms, lr: 9.999312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:05,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.60896 samples/s/p 3:35:00 } +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 332/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.999253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:08,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.65590 samples/s/p 3:33:10 } +2024-07-30 02:34:10,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 334/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.999193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:10,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66040 samples/s/p 3:32:57 } +2024-07-30 02:34:13,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 336/ 3125], loss: 0.487, per_step_time: 1413ms, lr: 9.99913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65995 samples/s/p 3:32:56 } +2024-07-30 02:34:16,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 338/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.999064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:16,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65977 samples/s/p 3:32:53 } +2024-07-30 02:34:19,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 340/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.998996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:19,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.66102 samples/s/p 3:32:48 } +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 342/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 9.998925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:22,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.65898 samples/s/p 3:32:49 } +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 344/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.998853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:25,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66010 samples/s/p 3:32:44 } +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 346/ 3125], loss: 0.434, per_step_time: 1412ms, lr: 9.998778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.66331 samples/s/p 3:32:34 } +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 348/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 9.9987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:30,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.65983 samples/s/p 3:32:39 } +2024-07-30 02:34:33,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 350/ 3125], loss: 0.393, per_step_time: 1416ms, lr: 9.99862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:33,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.64675 samples/s/p 3:33:06 } +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 352/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.998537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:36,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65693 samples/s/p 3:32:40 } +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 354/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.998453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:39,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66147 samples/s/p 3:32:27 } +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 356/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 9.998366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:42,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65866 samples/s/p 3:32:30 } +2024-07-30 02:34:45,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 358/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.998276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:45,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.66021 samples/s/p 3:32:24 } +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 360/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 9.998184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:47,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.65706 samples/s/p 3:32:28 } +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 362/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.99809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:50,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.65899 samples/s/p 3:32:21 } +2024-07-30 02:34:53,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 364/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.997993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:53,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66151 samples/s/p 3:32:13 } +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 366/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:56,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66058 samples/s/p 3:32:12 } +2024-07-30 02:34:59,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 368/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 9.997793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:34:59,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.66152 samples/s/p 3:32:07 } +2024-07-30 02:35:02,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 370/ 3125], loss: 0.284, per_step_time: 1425ms, lr: 9.99769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.61207 samples/s/p 3:33:56 } +2024-07-30 02:35:04,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 372/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.997583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:04,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.66005 samples/s/p 3:32:04 } +2024-07-30 02:35:07,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 374/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.997474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:07,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.65581 samples/s/p 3:32:11 } +2024-07-30 02:35:10,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 376/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 9.997363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:10,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.66118 samples/s/p 3:31:56 } +2024-07-30 02:35:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 378/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.997249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.65958 samples/s/p 3:31:57 } +2024-07-30 02:35:16,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 380/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.997134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:16,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65807 samples/s/p 3:31:58 } +2024-07-30 02:35:19,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 382/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 9.997016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:19,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65708 samples/s/p 3:31:57 } +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 384/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.996896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:21,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65803 samples/s/p 3:31:52 } +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 386/ 3125], loss: 0.075, per_step_time: 1414ms, lr: 9.996773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:24,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65575 samples/s/p 3:31:54 } +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 388/ 3125], loss: 0.596, per_step_time: 1414ms, lr: 9.996647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:27,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.65763 samples/s/p 3:31:47 } +2024-07-30 02:35:30,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 390/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.996519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:30,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66087 samples/s/p 3:31:37 } +2024-07-30 02:35:33,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 392/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 9.996389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:33,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66148 samples/s/p 3:31:33 } +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 394/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.996256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:36,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.66051 samples/s/p 3:31:32 } +2024-07-30 02:35:38,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 396/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.996122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:38,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65871 samples/s/p 3:31:34 } +2024-07-30 02:35:41,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 398/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 9.995984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:41,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.65378 samples/s/p 3:31:42 } +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 400/ 3125], loss: 0.145, per_step_time: 1412ms, lr: 9.995845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:44,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.66212 samples/s/p 3:31:20 } +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 402/ 3125], loss: 0.443, per_step_time: 1413ms, lr: 9.995703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:47,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65979 samples/s/p 3:31:23 } +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 404/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.995558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:50,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65946 samples/s/p 3:31:21 } +2024-07-30 02:35:53,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 406/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.995412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:53,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.65936 samples/s/p 3:31:18 } +2024-07-30 02:35:55,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 408/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.995262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:55,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65741 samples/s/p 3:31:20 } +2024-07-30 02:35:58,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 410/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 9.995111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:35:58,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65951 samples/s/p 3:31:12 } +2024-07-30 02:36:01,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 412/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.994957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:01,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65987 samples/s/p 3:31:08 } +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 414/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.994801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:04,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.66079 samples/s/p 3:31:03 } +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 416/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.994643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:07,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.65750 samples/s/p 3:31:08 } +2024-07-30 02:36:10,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 418/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.994482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66040 samples/s/p 3:30:59 } +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 420/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 9.994317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:12,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66250 samples/s/p 3:30:51 } +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 422/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 9.994152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.65804 samples/s/p 3:30:58 } +2024-07-30 02:36:18,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 424/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 9.993983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:18,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66200 samples/s/p 3:30:47 } +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 426/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.9938125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:21,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.66193 samples/s/p 3:30:44 } +2024-07-30 02:36:24,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 428/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.99364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:24,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.66152 samples/s/p 3:30:42 } +2024-07-30 02:36:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 430/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.993465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:27,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65951 samples/s/p 3:30:44 } +2024-07-30 02:36:29,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 432/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 9.993287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:29,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65763 samples/s/p 3:30:45 } +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 434/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 9.993107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:32,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.65979 samples/s/p 3:30:37 } +2024-07-30 02:36:35,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 436/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 9.992924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:35,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65721 samples/s/p 3:30:40 } +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 438/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 9.992738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:38,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65697 samples/s/p 3:30:38 } +2024-07-30 02:36:41,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 440/ 3125], loss: 0.661, per_step_time: 1413ms, lr: 9.992552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:41,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.66031 samples/s/p 3:30:28 } +2024-07-30 02:36:44,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 442/ 3125], loss: 0.255, per_step_time: 1416ms, lr: 9.992362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:44,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.64748 samples/s/p 3:30:54 } +2024-07-30 02:36:46,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 444/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.99217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:46,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.65805 samples/s/p 3:30:27 } +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 446/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.991976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:49,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65979 samples/s/p 3:30:20 } +2024-07-30 02:36:52,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 448/ 3125], loss: 0.331, per_step_time: 1415ms, lr: 9.991779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:52,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65298 samples/s/p 3:30:33 } +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 450/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.99158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:55,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.66256 samples/s/p 3:30:09 } +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 452/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.991378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:36:58,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65978 samples/s/p 3:30:12 } +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 454/ 3125], loss: 0.512, per_step_time: 1414ms, lr: 9.991173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:01,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.65720 samples/s/p 3:30:15 } +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 456/ 3125], loss: 0.390, per_step_time: 1414ms, lr: 9.990968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:03,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65557 samples/s/p 3:30:16 } +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 458/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.990758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:06,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65736 samples/s/p 3:30:09 } +2024-07-30 02:37:09,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 460/ 3125], loss: 0.634, per_step_time: 1412ms, lr: 9.990547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:09,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66418 samples/s/p 3:29:51 } +2024-07-30 02:37:12,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 462/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.990334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.66189 samples/s/p 3:29:53 } +2024-07-30 02:37:15,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 464/ 3125], loss: 0.291, per_step_time: 1414ms, lr: 9.990118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:15,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.65503 samples/s/p 3:30:06 } +2024-07-30 02:37:18,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 466/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 9.9899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:18,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.65972 samples/s/p 3:29:52 } +2024-07-30 02:37:20,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 468/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 9.98968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:20,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66140 samples/s/p 3:29:46 } +2024-07-30 02:37:23,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 470/ 3125], loss: 0.148, per_step_time: 1412ms, lr: 9.989456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:23,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.66197 samples/s/p 3:29:42 } +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 472/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.98923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:26,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.65957 samples/s/p 3:29:44 } +2024-07-30 02:37:29,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 474/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.989003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:29,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.66017 samples/s/p 3:29:40 } +2024-07-30 02:37:32,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 476/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 9.988773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:32,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.66005 samples/s/p 3:29:37 } +2024-07-30 02:37:35,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 478/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 9.98854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:35,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65938 samples/s/p 3:29:36 } +2024-07-30 02:37:37,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 480/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.9883055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:37,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65916 samples/s/p 3:29:34 } +2024-07-30 02:37:40,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 482/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 9.988068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:40,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.65548 samples/s/p 3:29:39 } +2024-07-30 02:37:43,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 484/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 9.987828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:43,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.66112 samples/s/p 3:29:24 } +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 486/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.987586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:46,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65885 samples/s/p 3:29:26 } +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 488/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.987341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:49,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65913 samples/s/p 3:29:23 } +2024-07-30 02:37:52,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 490/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 9.987094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:52,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.66130 samples/s/p 3:29:15 } +2024-07-30 02:37:54,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 492/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 9.986845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:54,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.65791 samples/s/p 3:29:20 } +2024-07-30 02:37:57,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 494/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 9.986594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:37:57,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65801 samples/s/p 3:29:17 } +2024-07-30 02:38:00,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 496/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 9.986339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:00,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65731 samples/s/p 3:29:15 } +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 498/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 9.986084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:03,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65697 samples/s/p 3:29:13 } +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 500/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 9.985824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.65756 samples/s/p 3:29:09 } +2024-07-30 02:38:09,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 502/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 9.985563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:09,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66010 samples/s/p 3:29:01 } +2024-07-30 02:38:11,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 504/ 3125], loss: 0.282, per_step_time: 1412ms, lr: 9.9853005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:11,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66352 samples/s/p 3:28:50 } +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 506/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 9.985034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:14,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65635 samples/s/p 3:29:03 } +2024-07-30 02:38:17,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 508/ 3125], loss: 0.528, per_step_time: 1413ms, lr: 9.984766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:17,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.66058 samples/s/p 3:28:51 } +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 510/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.984494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:20,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.65859 samples/s/p 3:28:53 } +2024-07-30 02:38:23,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 512/ 3125], loss: 0.172, per_step_time: 1415ms, lr: 9.984221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:23,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65301 samples/s/p 3:29:02 } +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 514/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.983946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:26,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65981 samples/s/p 3:28:44 } +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 516/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 9.983668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66199 samples/s/p 3:28:37 } +2024-07-30 02:38:31,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 518/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.983388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:31,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.66067 samples/s/p 3:28:37 } +2024-07-30 02:38:34,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 520/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 9.983105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:34,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.65971 samples/s/p 3:28:36 } +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 522/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 9.98282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66006 samples/s/p 3:28:32 } +2024-07-30 02:38:40,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 524/ 3125], loss: 0.506, per_step_time: 1412ms, lr: 9.982533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:40,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66193 samples/s/p 3:28:25 } +2024-07-30 02:38:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 526/ 3125], loss: 0.324, per_step_time: 1412ms, lr: 9.982244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:43,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66221 samples/s/p 3:28:22 } +2024-07-30 02:38:45,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 528/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.981952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:45,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.66156 samples/s/p 3:28:21 } +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 530/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.981657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66001 samples/s/p 3:28:21 } +2024-07-30 02:38:51,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 532/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.981361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:51,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66131 samples/s/p 3:28:16 } +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 534/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.981061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:54,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66054 samples/s/p 3:28:14 } +2024-07-30 02:38:57,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 536/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.980759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:38:57,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66036 samples/s/p 3:28:12 } +2024-07-30 02:39:00,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 538/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.980456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:00,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.66214 samples/s/p 3:28:05 } +2024-07-30 02:39:02,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 540/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.980149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:02,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65967 samples/s/p 3:28:08 } +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 542/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.97984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:05,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.66065 samples/s/p 3:28:03 } +2024-07-30 02:39:08,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 544/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 9.979529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:08,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65787 samples/s/p 3:28:06 } +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 546/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.979216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:11,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65401 samples/s/p 3:28:12 } +2024-07-30 02:39:14,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 548/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 9.9788995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:14,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.65659 samples/s/p 3:28:03 } +2024-07-30 02:39:17,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 550/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.978581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:17,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65947 samples/s/p 3:27:54 } +2024-07-30 02:39:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 552/ 3125], loss: 0.391, per_step_time: 1415ms, lr: 9.978261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65218 samples/s/p 3:28:07 } +2024-07-30 02:39:22,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 554/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.977938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:22,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.65723 samples/s/p 3:27:53 } +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 556/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.9776125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.66061 samples/s/p 3:27:43 } +2024-07-30 02:39:28,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 558/ 3125], loss: 0.101, per_step_time: 1413ms, lr: 9.977284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:28,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66073 samples/s/p 3:27:40 } +2024-07-30 02:39:31,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 560/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 9.976954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:31,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66209 samples/s/p 3:27:34 } +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 562/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:34,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.66027 samples/s/p 3:27:35 } +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 564/ 3125], loss: 0.431, per_step_time: 1412ms, lr: 9.976287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:36,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.66179 samples/s/p 3:27:29 } +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 566/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.97595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:39,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.65923 samples/s/p 3:27:32 } +2024-07-30 02:39:42,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 568/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 9.97561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.66300 samples/s/p 3:27:21 } +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 570/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 9.975269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:45,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65501 samples/s/p 3:27:36 } +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 572/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 9.974923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:48,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65927 samples/s/p 3:27:24 } +2024-07-30 02:39:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 574/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.974578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:51,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65863 samples/s/p 3:27:22 } +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 576/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.974228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:53,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.65618 samples/s/p 3:27:25 } +2024-07-30 02:39:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 578/ 3125], loss: 0.401, per_step_time: 1414ms, lr: 9.973876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:56,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65719 samples/s/p 3:27:20 } +2024-07-30 02:39:59,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 580/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.9735225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:39:59,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65972 samples/s/p 3:27:11 } +2024-07-30 02:40:02,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 582/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 9.973166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:02,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.65728 samples/s/p 3:27:14 } +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 584/ 3125], loss: 0.215, per_step_time: 1418ms, lr: 9.972808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:05,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.64004 samples/s/p 3:27:49 } +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 586/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.972447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:08,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66087 samples/s/p 3:27:00 } +2024-07-30 02:40:10,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 588/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.972084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:10,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66018 samples/s/p 3:26:59 } +2024-07-30 02:40:13,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 590/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 9.971717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:13,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.66202 samples/s/p 3:26:52 } +2024-07-30 02:40:16,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 592/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 9.971349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:16,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65759 samples/s/p 3:26:59 } +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 594/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.970979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:19,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.65775 samples/s/p 3:26:56 } +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 596/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 9.970605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:22,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65777 samples/s/p 3:26:53 } +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 598/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.970231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65954 samples/s/p 3:26:46 } +2024-07-30 02:40:27,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 600/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 9.969853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:27,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65221 samples/s/p 3:26:59 } +2024-07-30 02:40:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 602/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 9.969473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65956 samples/s/p 3:26:40 } +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 604/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 9.96909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:33,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.65995 samples/s/p 3:26:37 } +2024-07-30 02:40:36,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 606/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.968706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:36,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65970 samples/s/p 3:26:34 } +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 608/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.968318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:39,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65818 samples/s/p 3:26:35 } +2024-07-30 02:40:42,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 610/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 9.967929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:42,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66231 samples/s/p 3:26:23 } +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 612/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.967536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:44,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.66070 samples/s/p 3:26:24 } +2024-07-30 02:40:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 614/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 9.967143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.65958 samples/s/p 3:26:23 } +2024-07-30 02:40:50,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 616/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.966746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:50,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66055 samples/s/p 3:26:19 } +2024-07-30 02:40:53,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 618/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.966347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65134 samples/s/p 3:26:36 } +2024-07-30 02:40:56,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 620/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.9659455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:56,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.66088 samples/s/p 3:26:12 } +2024-07-30 02:40:59,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 622/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 9.965543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:40:59,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.65623 samples/s/p 3:26:19 } +2024-07-30 02:41:02,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 624/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 9.965136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:02,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66077 samples/s/p 3:26:07 } +2024-07-30 02:41:04,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 626/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 9.964728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66231 samples/s/p 3:26:01 } +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 628/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.964317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:07,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65857 samples/s/p 3:26:06 } +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 630/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.963903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:10,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.66073 samples/s/p 3:25:58 } +2024-07-30 02:41:13,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 632/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.963488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:13,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.65902 samples/s/p 3:25:59 } +2024-07-30 02:41:16,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 634/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 9.96307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:16,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65135 samples/s/p 3:26:13 } +2024-07-30 02:41:19,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 636/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 9.96265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:19,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65633 samples/s/p 3:25:59 } +2024-07-30 02:41:21,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 638/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 9.9622275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:21,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65931 samples/s/p 3:25:50 } +2024-07-30 02:41:24,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 640/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.961802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:24,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.66277 samples/s/p 3:25:40 } +2024-07-30 02:41:27,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 642/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.961374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:27,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.65940 samples/s/p 3:25:44 } +2024-07-30 02:41:30,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 644/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.960944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:30,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65810 samples/s/p 3:25:44 } +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 646/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 9.960513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:33,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65500 samples/s/p 3:25:48 } +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 648/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 9.9600775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:36,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.66099 samples/s/p 3:25:32 } +2024-07-30 02:41:38,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 650/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.959642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:38,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.65936 samples/s/p 3:25:33 } +2024-07-30 02:41:41,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 652/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.9592025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:41,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65448 samples/s/p 3:25:41 } +2024-07-30 02:41:44,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 654/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 9.9587605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:44,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65514 samples/s/p 3:25:37 } +2024-07-30 02:41:47,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 656/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 9.958317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:47,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65742 samples/s/p 3:25:29 } +2024-07-30 02:41:50,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 658/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.95787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:50,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.65960 samples/s/p 3:25:21 } +2024-07-30 02:41:53,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 660/ 3125], loss: 0.096, per_step_time: 1412ms, lr: 9.957421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:53,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.66277 samples/s/p 3:25:12 } +2024-07-30 02:41:55,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 662/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.95697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65887 samples/s/p 3:25:17 } +2024-07-30 02:41:58,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 664/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 9.956517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:41:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66010 samples/s/p 3:25:12 } +2024-07-30 02:42:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 666/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.95606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66129 samples/s/p 3:25:06 } +2024-07-30 02:42:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 668/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 9.955603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:04,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.65821 samples/s/p 3:25:10 } +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 670/ 3125], loss: 0.103, per_step_time: 1412ms, lr: 9.955142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:07,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.66176 samples/s/p 3:25:00 } +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 672/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.95468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:10,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66138 samples/s/p 3:24:58 } +2024-07-30 02:42:12,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 674/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 9.954214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:12,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.66117 samples/s/p 3:24:55 } +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 676/ 3125], loss: 0.388, per_step_time: 1414ms, lr: 9.953746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:15,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65437 samples/s/p 3:25:07 } +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 678/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.953275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:18,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.65965 samples/s/p 3:24:53 } +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 680/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.952803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:21,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65966 samples/s/p 3:24:50 } +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 682/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.9523295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65792 samples/s/p 3:24:51 } +2024-07-30 02:42:27,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 684/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.951851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:27,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65767 samples/s/p 3:24:49 } +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 686/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.951372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.65923 samples/s/p 3:24:42 } +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 688/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 9.950891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:32,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.64952 samples/s/p 3:25:01 } +2024-07-30 02:42:35,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 690/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.950406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:35,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65606 samples/s/p 3:24:44 } +2024-07-30 02:42:38,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 692/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 9.94992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:38,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.65972 samples/s/p 3:24:33 } +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 694/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.949431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:41,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66111 samples/s/p 3:24:27 } +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 696/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.948939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66112 samples/s/p 3:24:24 } +2024-07-30 02:42:46,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 698/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.948445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:46,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.66104 samples/s/p 3:24:22 } +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 700/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.947949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:49,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65915 samples/s/p 3:24:23 } +2024-07-30 02:42:52,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 702/ 3125], loss: 0.373, per_step_time: 1416ms, lr: 9.947451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:52,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.64816 samples/s/p 3:24:44 } +2024-07-30 02:42:55,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 704/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.946951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.65530 samples/s/p 3:24:26 } +2024-07-30 02:42:58,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 706/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.946447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:42:58,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.66165 samples/s/p 3:24:09 } +2024-07-30 02:43:01,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 708/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.945942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:01,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.65924 samples/s/p 3:24:11 } +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 710/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 9.945434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:03,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66228 samples/s/p 3:24:02 } +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 712/ 3125], loss: 0.347, per_step_time: 1412ms, lr: 9.9449235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:06,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66176 samples/s/p 3:24:00 } +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 714/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 9.944411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:09,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66267 samples/s/p 3:23:55 } +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 716/ 3125], loss: 0.372, per_step_time: 1412ms, lr: 9.943897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:12,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.66251 samples/s/p 3:23:53 } +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 718/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 9.943379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:15,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66212 samples/s/p 3:23:51 } +2024-07-30 02:43:18,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 720/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 9.942859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.66291 samples/s/p 3:23:46 } +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 722/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 9.942337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:20,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65583 samples/s/p 3:23:59 } +2024-07-30 02:43:23,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 724/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.941812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:23,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65513 samples/s/p 3:23:58 } +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 726/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.941286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:26,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.65508 samples/s/p 3:23:55 } +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 728/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.940757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:29,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65972 samples/s/p 3:23:42 } +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 730/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 9.940226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:32,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65731 samples/s/p 3:23:44 } +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 732/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 9.939692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:35,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.65759 samples/s/p 3:23:41 } +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 734/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.9391555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:37,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.66118 samples/s/p 3:23:30 } +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 736/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 9.938616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:40,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66134 samples/s/p 3:23:27 } +2024-07-30 02:43:43,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 738/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.938076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:43,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65899 samples/s/p 3:23:29 } +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 740/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 9.937533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:46,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.66168 samples/s/p 3:23:21 } +2024-07-30 02:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 742/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 9.936987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65665 samples/s/p 3:23:29 } +2024-07-30 02:43:52,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 744/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 9.93644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:52,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.65247 samples/s/p 3:23:35 } +2024-07-30 02:43:54,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 746/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 9.935889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:54,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65084 samples/s/p 3:23:36 } +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 748/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.9353365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:43:57,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.65826 samples/s/p 3:23:17 } +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 9.934782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65537 samples/s/p 3:23:20 } +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 752/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 9.934223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:03,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65594 samples/s/p 3:23:16 } +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 754/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 9.933664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.65725 samples/s/p 3:23:11 } +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 756/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 9.933102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:09,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66196 samples/s/p 3:22:58 } +2024-07-30 02:44:11,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 758/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 9.932538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:11,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66037 samples/s/p 3:22:58 } +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 760/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.931971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66052 samples/s/p 3:22:55 } +2024-07-30 02:44:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 762/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 9.931402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:17,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.66038 samples/s/p 3:22:53 } +2024-07-30 02:44:20,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 764/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.93083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:20,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.65999 samples/s/p 3:22:51 } +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.930256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:23,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.66066 samples/s/p 3:22:46 } +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 768/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.92968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:26,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.65970 samples/s/p 3:22:46 } +2024-07-30 02:44:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 770/ 3125], loss: 0.407, per_step_time: 1420ms, lr: 9.929101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.63262 samples/s/p 3:23:41 } +2024-07-30 02:44:31,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 772/ 3125], loss: 0.230, per_step_time: 1421ms, lr: 9.928521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:31,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.62869 samples/s/p 3:23:47 } +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 774/ 3125], loss: 0.346, per_step_time: 1417ms, lr: 9.927937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:34,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64472 samples/s/p 3:23:09 } +2024-07-30 02:44:37,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 776/ 3125], loss: 0.453, per_step_time: 1416ms, lr: 9.927351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:37,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64871 samples/s/p 3:22:58 } +2024-07-30 02:44:40,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 778/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 9.926764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:40,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.64946 samples/s/p 3:22:53 } +2024-07-30 02:44:43,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 780/ 3125], loss: 0.240, per_step_time: 1415ms, lr: 9.926173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:43,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.65183 samples/s/p 3:22:45 } +2024-07-30 02:44:45,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 782/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 9.92558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:45,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.65874 samples/s/p 3:22:28 } +2024-07-30 02:44:48,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 784/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.9249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:48,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.66017 samples/s/p 3:22:22 } +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 786/ 3125], loss: 0.095, per_step_time: 1414ms, lr: 9.924388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:51,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65415 samples/s/p 3:22:32 } +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 788/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.923788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:54,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65990 samples/s/p 3:22:17 } +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 790/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.923186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:44:57,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65970 samples/s/p 3:22:14 } +2024-07-30 02:45:00,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 792/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 9.922582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:00,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.65981 samples/s/p 3:22:11 } +2024-07-30 02:45:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 794/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.921975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65941 samples/s/p 3:22:09 } +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 796/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.921366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.66124 samples/s/p 3:22:03 } +2024-07-30 02:45:08,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 798/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.920755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:08,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65837 samples/s/p 3:22:06 } +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 800/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 9.920141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:11,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.65860 samples/s/p 3:22:03 } +2024-07-30 02:45:14,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 802/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.919525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:14,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65971 samples/s/p 3:21:57 } +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 804/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 9.918906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:17,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65723 samples/s/p 3:22:00 } +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 806/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.918285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:19,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65903 samples/s/p 3:21:53 } +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 808/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 9.917661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:22,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.65393 samples/s/p 3:22:01 } +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 810/ 3125], loss: 0.288, per_step_time: 1421ms, lr: 9.917036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:25,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.62632 samples/s/p 3:22:58 } +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 812/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.916408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.65908 samples/s/p 3:21:45 } +2024-07-30 02:45:31,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 814/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.915778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:31,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66041 samples/s/p 3:21:39 } +2024-07-30 02:45:34,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 816/ 3125], loss: 0.241, per_step_time: 1416ms, lr: 9.915146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:34,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.64655 samples/s/p 3:22:06 } +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 818/ 3125], loss: 0.152, per_step_time: 1425ms, lr: 9.91451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:37,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.61204 samples/s/p 3:23:18 } +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 820/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 9.913872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:39,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.66062 samples/s/p 3:21:30 } +2024-07-30 02:45:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 822/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 9.913233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.64051 samples/s/p 3:22:10 } +2024-07-30 02:45:45,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 824/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.912591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:45,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66167 samples/s/p 3:21:22 } +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 826/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.911947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:48,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.66038 samples/s/p 3:21:22 } +2024-07-30 02:45:51,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 828/ 3125], loss: 0.211, per_step_time: 1426ms, lr: 9.9112995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:51,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.60938 samples/s/p 3:23:09 } +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 830/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 9.910651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:54,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66235 samples/s/p 3:21:12 } +2024-07-30 02:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 832/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.909999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65989 samples/s/p 3:21:15 } +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 834/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 9.909346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:45:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.65917 samples/s/p 3:21:13 } +2024-07-30 02:46:02,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 836/ 3125], loss: 0.101, per_step_time: 1412ms, lr: 9.908689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66246 samples/s/p 3:21:04 } +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 838/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 9.908032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:05,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.66052 samples/s/p 3:21:05 } +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 840/ 3125], loss: 0.184, per_step_time: 1412ms, lr: 9.90737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:08,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66174 samples/s/p 3:20:59 } +2024-07-30 02:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 842/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.906707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65903 samples/s/p 3:21:02 } +2024-07-30 02:46:13,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 844/ 3125], loss: 0.366, per_step_time: 1415ms, lr: 9.906042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:13,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65272 samples/s/p 3:21:13 } +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 846/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 9.905374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:16,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.66133 samples/s/p 3:20:52 } +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 848/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.904704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:19,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.65793 samples/s/p 3:20:56 } +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 850/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.904032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:22,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65921 samples/s/p 3:20:51 } +2024-07-30 02:46:25,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 852/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 9.903357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:25,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65670 samples/s/p 3:20:53 } +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 854/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 9.902679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:28,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65977 samples/s/p 3:20:44 } +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 856/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:30,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.65772 samples/s/p 3:20:45 } +2024-07-30 02:46:33,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 858/ 3125], loss: 0.175, per_step_time: 1416ms, lr: 9.901319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:33,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.64859 samples/s/p 3:21:02 } +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 860/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 9.900634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:36,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65578 samples/s/p 3:20:44 } +2024-07-30 02:46:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 862/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 9.899947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65988 samples/s/p 3:20:32 } +2024-07-30 02:46:42,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 864/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.899259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:42,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.65870 samples/s/p 3:20:32 } +2024-07-30 02:46:45,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 866/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.8985665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:45,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.66031 samples/s/p 3:20:26 } +2024-07-30 02:46:47,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 868/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.8978735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:47,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65749 samples/s/p 3:20:29 } +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 870/ 3125], loss: 0.532, per_step_time: 1413ms, lr: 9.897178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:50,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66078 samples/s/p 3:20:19 } +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 872/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.896479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:53,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65771 samples/s/p 3:20:23 } +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 874/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 9.895779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:56,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.65977 samples/s/p 3:20:16 } +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 876/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.895076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:46:59,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.66120 samples/s/p 3:20:10 } +2024-07-30 02:47:02,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 878/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 9.894371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:02,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.66024 samples/s/p 3:20:09 } +2024-07-30 02:47:04,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 880/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 9.893663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:04,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65552 samples/s/p 3:20:16 } +2024-07-30 02:47:07,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 882/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 9.892953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65934 samples/s/p 3:20:05 } +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 884/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.892241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:10,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.65898 samples/s/p 3:20:03 } +2024-07-30 02:47:13,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 886/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.891526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:13,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66058 samples/s/p 3:19:57 } +2024-07-30 02:47:16,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 888/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 9.890809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:16,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65340 samples/s/p 3:20:09 } +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 890/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 9.89009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:19,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.66258 samples/s/p 3:19:47 } +2024-07-30 02:47:21,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 892/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.889369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:21,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65814 samples/s/p 3:19:54 } +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 894/ 3125], loss: 0.480, per_step_time: 1414ms, lr: 9.888645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:24,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.65633 samples/s/p 3:19:55 } +2024-07-30 02:47:27,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 896/ 3125], loss: 0.519, per_step_time: 1413ms, lr: 9.887918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:27,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65813 samples/s/p 3:19:48 } +2024-07-30 02:47:30,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 898/ 3125], loss: 0.440, per_step_time: 1414ms, lr: 9.88719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:30,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65748 samples/s/p 3:19:46 } +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 900/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 9.886458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.66330 samples/s/p 3:19:31 } +2024-07-30 02:47:36,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 902/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 9.885725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:36,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65945 samples/s/p 3:19:37 } +2024-07-30 02:47:38,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 904/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 9.8849905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:38,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.65784 samples/s/p 3:19:37 } +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 906/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 9.884252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:41,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65729 samples/s/p 3:19:36 } +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 908/ 3125], loss: 0.134, per_step_time: 1414ms, lr: 9.883512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:44,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65756 samples/s/p 3:19:32 } +2024-07-30 02:47:47,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 910/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.8827695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:47,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65884 samples/s/p 3:19:27 } +2024-07-30 02:47:50,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 912/ 3125], loss: 0.361, per_step_time: 1412ms, lr: 9.882025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:50,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.66185 samples/s/p 3:19:17 } +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 914/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.881277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:53,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.65940 samples/s/p 3:19:20 } +2024-07-30 02:47:55,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 916/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.8805285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:55,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.66079 samples/s/p 3:19:14 } +2024-07-30 02:47:58,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 918/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.879776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:47:58,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65903 samples/s/p 3:19:15 } +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 920/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.8790215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:01,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65878 samples/s/p 3:19:13 } +2024-07-30 02:48:04,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 922/ 3125], loss: 0.426, per_step_time: 1414ms, lr: 9.878265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:04,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.65632 samples/s/p 3:19:15 } +2024-07-30 02:48:07,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 924/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 9.877506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:07,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65419 samples/s/p 3:19:17 } +2024-07-30 02:48:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 926/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 9.876745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:10,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65738 samples/s/p 3:19:07 } +2024-07-30 02:48:12,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 928/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 9.875981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:12,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65893 samples/s/p 3:19:01 } +2024-07-30 02:48:15,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 930/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 9.875215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:15,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.65759 samples/s/p 3:19:01 } +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 932/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 9.874447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:18,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.66074 samples/s/p 3:18:52 } +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 934/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.873676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:21,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.65479 samples/s/p 3:19:01 } +2024-07-30 02:48:24,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 936/ 3125], loss: 0.248, per_step_time: 1424ms, lr: 9.872903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:24,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.61474 samples/s/p 3:20:24 } +2024-07-30 02:48:27,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 938/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.872128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:27,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65857 samples/s/p 3:18:48 } +2024-07-30 02:48:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 940/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 9.871351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:30,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.65991 samples/s/p 3:18:42 } +2024-07-30 02:48:32,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 942/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 9.8705705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.66126 samples/s/p 3:18:36 } +2024-07-30 02:48:35,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 944/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 9.869788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.65944 samples/s/p 3:18:37 } +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 946/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.869004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:38,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66181 samples/s/p 3:18:29 } +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 948/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 9.868218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:41,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66049 samples/s/p 3:18:29 } +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 950/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.867428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.66136 samples/s/p 3:18:25 } +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 952/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 9.866637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66108 samples/s/p 3:18:23 } +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 954/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.865843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:49,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66166 samples/s/p 3:18:18 } +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 956/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 9.865046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:52,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.66004 samples/s/p 3:18:19 } +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 958/ 3125], loss: 0.088, per_step_time: 1417ms, lr: 9.864249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:55,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.64560 samples/s/p 3:18:47 } +2024-07-30 02:48:58,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 960/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 9.863448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:48:58,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.65071 samples/s/p 3:18:33 } +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 962/ 3125], loss: 0.118, per_step_time: 1422ms, lr: 9.862644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:01,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.62483 samples/s/p 3:19:25 } +2024-07-30 02:49:04,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 964/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.861839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:04,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65807 samples/s/p 3:18:12 } +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 966/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 9.861032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:06,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65870 samples/s/p 3:18:08 } +2024-07-30 02:49:09,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 968/ 3125], loss: 0.405, per_step_time: 1415ms, lr: 9.860221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:09,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65066 samples/s/p 3:18:22 } +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 970/ 3125], loss: 0.535, per_step_time: 1413ms, lr: 9.859409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:12,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.65862 samples/s/p 3:18:02 } +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 972/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 9.858593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:15,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66001 samples/s/p 3:17:57 } +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 974/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 9.8577775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:18,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.65911 samples/s/p 3:17:56 } +2024-07-30 02:49:21,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 976/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.856958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:21,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66139 samples/s/p 3:17:48 } +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 978/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.856137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:23,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.66018 samples/s/p 3:17:48 } +2024-07-30 02:49:26,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 980/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 9.855313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:26,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66156 samples/s/p 3:17:42 } +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 982/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.854486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:29,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65793 samples/s/p 3:17:47 } +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 984/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.8536575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:32,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.65982 samples/s/p 3:17:40 } +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 986/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.852827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66071 samples/s/p 3:17:35 } +2024-07-30 02:49:38,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 988/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.851993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:38,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.66031 samples/s/p 3:17:33 } +2024-07-30 02:49:40,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 990/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 9.851158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:40,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65393 samples/s/p 3:17:44 } +2024-07-30 02:49:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 992/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.85032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.66131 samples/s/p 3:17:26 } +2024-07-30 02:49:46,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 994/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.849479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65826 samples/s/p 3:17:29 } +2024-07-30 02:49:49,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 996/ 3125], loss: 0.733, per_step_time: 1414ms, lr: 9.848637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:49,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65770 samples/s/p 3:17:27 } +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 998/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.847792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:52,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.65558 samples/s/p 3:17:29 } +2024-07-30 02:49:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1000/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 9.846945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:55,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65776 samples/s/p 3:17:22 } +2024-07-30 02:49:57,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1002/ 3125], loss: 0.196, per_step_time: 1415ms, lr: 9.846096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:49:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65266 samples/s/p 3:17:29 } +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1004/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.845244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:00,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65851 samples/s/p 3:17:14 } +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1006/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 9.84439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:03,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.65830 samples/s/p 3:17:12 } +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1008/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 9.843533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:06,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65466 samples/s/p 3:17:17 } +2024-07-30 02:50:09,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1010/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.842675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:09,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.65845 samples/s/p 3:17:06 } +2024-07-30 02:50:12,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1012/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 9.841814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:12,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66021 samples/s/p 3:17:00 } +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1014/ 3125], loss: 0.384, per_step_time: 1412ms, lr: 9.840951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:14,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66197 samples/s/p 3:16:53 } +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1016/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.840085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:17,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.66021 samples/s/p 3:16:54 } +2024-07-30 02:50:20,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1018/ 3125], loss: 0.232, per_step_time: 1416ms, lr: 9.839217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:20,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64673 samples/s/p 3:17:19 } +2024-07-30 02:50:23,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1020/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 9.838346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:23,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.65935 samples/s/p 3:16:50 } +2024-07-30 02:50:26,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1022/ 3125], loss: 0.533, per_step_time: 1416ms, lr: 9.837474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.64594 samples/s/p 3:17:15 } +2024-07-30 02:50:29,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1024/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.836599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:29,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.66018 samples/s/p 3:16:43 } +2024-07-30 02:50:31,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1026/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.835722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:31,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.66123 samples/s/p 3:16:38 } +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1028/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 9.834843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:34,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66195 samples/s/p 3:16:33 } +2024-07-30 02:50:37,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1030/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.833961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:37,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66070 samples/s/p 3:16:33 } +2024-07-30 02:50:40,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1032/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.833077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:40,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.65970 samples/s/p 3:16:32 } +2024-07-30 02:50:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1034/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.83219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:43,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.66234 samples/s/p 3:16:24 } +2024-07-30 02:50:46,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1036/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 9.831302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:46,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66232 samples/s/p 3:16:21 } +2024-07-30 02:50:48,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1038/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 9.83041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:48,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.65940 samples/s/p 3:16:24 } +2024-07-30 02:50:51,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1040/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 9.829518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:51,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66153 samples/s/p 3:16:17 } +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1042/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.828622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:54,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66026 samples/s/p 3:16:17 } +2024-07-30 02:50:57,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1044/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.827724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:50:57,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.66055 samples/s/p 3:16:14 } +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1046/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 9.826823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:00,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65703 samples/s/p 3:16:18 } +2024-07-30 02:51:03,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1048/ 3125], loss: 0.387, per_step_time: 1414ms, lr: 9.825921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:03,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65750 samples/s/p 3:16:14 } +2024-07-30 02:51:05,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1050/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 9.825016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:05,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65596 samples/s/p 3:16:15 } +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1052/ 3125], loss: 0.115, per_step_time: 1413ms, lr: 9.824109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:08,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.66058 samples/s/p 3:16:02 } +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1054/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 9.8231985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:11,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.65709 samples/s/p 3:16:07 } +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1056/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 9.822287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:14,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66009 samples/s/p 3:15:58 } +2024-07-30 02:51:17,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1058/ 3125], loss: 0.219, per_step_time: 1416ms, lr: 9.821373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:17,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.64685 samples/s/p 3:16:22 } +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1060/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 9.820457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:20,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66064 samples/s/p 3:15:51 } +2024-07-30 02:51:22,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1062/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 9.819539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.65247 samples/s/p 3:16:05 } +2024-07-30 02:51:25,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1064/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 9.8186165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:25,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.66117 samples/s/p 3:15:44 } +2024-07-30 02:51:28,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1066/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.817693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:28,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65996 samples/s/p 3:15:44 } +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1068/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 9.8167675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:31,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66261 samples/s/p 3:15:35 } +2024-07-30 02:51:34,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1070/ 3125], loss: 0.564, per_step_time: 1413ms, lr: 9.815841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:34,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.65880 samples/s/p 3:15:40 } +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1072/ 3125], loss: 0.245, per_step_time: 1412ms, lr: 9.81491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:37,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.66185 samples/s/p 3:15:31 } +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1074/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 9.813978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:39,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65673 samples/s/p 3:15:39 } +2024-07-30 02:51:42,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1076/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 9.813043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:42,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66029 samples/s/p 3:15:29 } +2024-07-30 02:51:45,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1078/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.812105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:45,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66137 samples/s/p 3:15:24 } +2024-07-30 02:51:48,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1080/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 9.811166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:48,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.66170 samples/s/p 3:15:20 } +2024-07-30 02:51:51,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1082/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.810225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:51,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.65908 samples/s/p 3:15:23 } +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1084/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.8092805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66042 samples/s/p 3:15:17 } +2024-07-30 02:51:56,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1086/ 3125], loss: 0.335, per_step_time: 1412ms, lr: 9.808335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:56,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.66253 samples/s/p 3:15:10 } +2024-07-30 02:51:59,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1088/ 3125], loss: 0.302, per_step_time: 1416ms, lr: 9.807386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:51:59,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.64785 samples/s/p 3:15:38 } +2024-07-30 02:52:02,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1090/ 3125], loss: 0.307, per_step_time: 1415ms, lr: 9.806435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:02,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65082 samples/s/p 3:15:29 } +2024-07-30 02:52:05,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1092/ 3125], loss: 0.224, per_step_time: 1415ms, lr: 9.8054825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:05,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.65131 samples/s/p 3:15:25 } +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1094/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 9.804527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65326 samples/s/p 3:15:18 } +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1096/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.803569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:11,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65936 samples/s/p 3:15:03 } +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1098/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 9.8026085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:13,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65764 samples/s/p 3:15:03 } +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1100/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 9.801647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:16,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.65773 samples/s/p 3:15:00 } +2024-07-30 02:52:19,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1102/ 3125], loss: 0.628, per_step_time: 1413ms, lr: 9.800682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:19,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65864 samples/s/p 3:14:56 } +2024-07-30 02:52:22,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1104/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.799715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:22,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66134 samples/s/p 3:14:47 } +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1106/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 9.798746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66113 samples/s/p 3:14:45 } +2024-07-30 02:52:28,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1108/ 3125], loss: 0.553, per_step_time: 1413ms, lr: 9.7977745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.65988 samples/s/p 3:14:45 } +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1110/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 9.7968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:30,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.66215 samples/s/p 3:14:37 } +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1112/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 9.795824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:33,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65886 samples/s/p 3:14:41 } +2024-07-30 02:52:36,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1114/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.794847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:36,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66005 samples/s/p 3:14:36 } +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1116/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 9.7938655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:39,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.65999 samples/s/p 3:14:33 } +2024-07-30 02:52:42,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1118/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 9.792882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:42,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66135 samples/s/p 3:14:27 } +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1120/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 9.791896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:45,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.66172 samples/s/p 3:14:24 } +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1122/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 9.790909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:47,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.65774 samples/s/p 3:14:29 } +2024-07-30 02:52:50,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1124/ 3125], loss: 0.094, per_step_time: 1416ms, lr: 9.789919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:50,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.64852 samples/s/p 3:14:45 } +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1126/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.788928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.65883 samples/s/p 3:14:21 } +2024-07-30 02:52:56,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1128/ 3125], loss: 0.300, per_step_time: 1416ms, lr: 9.787934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:56,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.64633 samples/s/p 3:14:44 } +2024-07-30 02:52:59,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1130/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 9.786936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:52:59,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66024 samples/s/p 3:14:13 } +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1132/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.785938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:02,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65873 samples/s/p 3:14:13 } +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1134/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.784937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:05,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65966 samples/s/p 3:14:08 } +2024-07-30 02:53:07,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1136/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 9.783933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:07,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.66233 samples/s/p 3:14:00 } +2024-07-30 02:53:10,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1138/ 3125], loss: 0.158, per_step_time: 1414ms, lr: 9.782927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:10,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.65531 samples/s/p 3:14:12 } +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1140/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.781919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:13,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.66038 samples/s/p 3:13:58 } +2024-07-30 02:53:16,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1142/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.780909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:16,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65658 samples/s/p 3:14:03 } +2024-07-30 02:53:19,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1144/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 9.779896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:19,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65399 samples/s/p 3:14:06 } +2024-07-30 02:53:22,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1146/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 9.778881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:22,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65713 samples/s/p 3:13:56 } +2024-07-30 02:53:24,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1148/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.777864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:24,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.65938 samples/s/p 3:13:49 } +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1150/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 9.776844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:27,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65597 samples/s/p 3:13:53 } +2024-07-30 02:53:30,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1152/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 9.775823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:30,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.66123 samples/s/p 3:13:40 } +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1154/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.774798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:33,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65677 samples/s/p 3:13:46 } +2024-07-30 02:53:36,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1156/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.773771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:36,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.65871 samples/s/p 3:13:39 } +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1158/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.772743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:39,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66030 samples/s/p 3:13:33 } +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1160/ 3125], loss: 0.465, per_step_time: 1412ms, lr: 9.771713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:41,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66210 samples/s/p 3:13:27 } +2024-07-30 02:53:44,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1162/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.770679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:44,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65858 samples/s/p 3:13:31 } +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1164/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 9.769644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.65878 samples/s/p 3:13:28 } +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1166/ 3125], loss: 0.355, per_step_time: 1412ms, lr: 9.768606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:50,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.66311 samples/s/p 3:13:16 } +2024-07-30 02:53:53,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1168/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.767566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:53,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66036 samples/s/p 3:13:19 } +2024-07-30 02:53:56,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1170/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 9.766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:56,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.66155 samples/s/p 3:13:14 } +2024-07-30 02:53:58,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1172/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 9.765479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:53:58,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65799 samples/s/p 3:13:18 } +2024-07-30 02:54:01,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1174/ 3125], loss: 0.124, per_step_time: 1416ms, lr: 9.764432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:01,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.64939 samples/s/p 3:13:33 } +2024-07-30 02:54:04,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1176/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 9.763384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:04,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.65920 samples/s/p 3:13:10 } +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1178/ 3125], loss: 0.391, per_step_time: 1414ms, lr: 9.762332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:07,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65466 samples/s/p 3:13:16 } +2024-07-30 02:54:10,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1180/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 9.761278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:10,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65566 samples/s/p 3:13:11 } +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1182/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.760222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:13,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65843 samples/s/p 3:13:03 } +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1184/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 9.759164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:15,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.65627 samples/s/p 3:13:05 } +2024-07-30 02:54:18,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1186/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 9.758104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65863 samples/s/p 3:12:57 } +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1188/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.75704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:21,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.65999 samples/s/p 3:12:51 } +2024-07-30 02:54:24,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1190/ 3125], loss: 0.580, per_step_time: 1413ms, lr: 9.755976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:24,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66123 samples/s/p 3:12:46 } +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1192/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 9.754908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:27,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66004 samples/s/p 3:12:45 } +2024-07-30 02:54:30,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1194/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 9.75384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:30,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.66013 samples/s/p 3:12:42 } +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1196/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.752767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:32,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66102 samples/s/p 3:12:38 } +2024-07-30 02:54:35,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1198/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.751693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:35,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65845 samples/s/p 3:12:40 } +2024-07-30 02:54:38,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1200/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:38,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65784 samples/s/p 3:12:39 } +2024-07-30 02:54:41,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1202/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 9.749538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:41,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.65897 samples/s/p 3:12:34 } +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1204/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 9.748457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:44,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.66131 samples/s/p 3:12:26 } +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1206/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 9.747374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:47,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65739 samples/s/p 3:12:31 } +2024-07-30 02:54:49,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1208/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.746288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:49,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66002 samples/s/p 3:12:23 } +2024-07-30 02:54:52,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1210/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 9.7452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65978 samples/s/p 3:12:21 } +2024-07-30 02:54:55,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1212/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 9.744111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:55,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.65781 samples/s/p 3:12:22 } +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1214/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 9.7430175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:54:58,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.66014 samples/s/p 3:12:14 } +2024-07-30 02:55:01,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1216/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 9.741923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:01,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.66069 samples/s/p 3:12:10 } +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1218/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.7408265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.65895 samples/s/p 3:12:11 } +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1220/ 3125], loss: 0.406, per_step_time: 1417ms, lr: 9.739729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:06,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64209 samples/s/p 3:12:43 } +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1222/ 3125], loss: 0.280, per_step_time: 1416ms, lr: 9.738626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:09,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.64775 samples/s/p 3:12:28 } +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1224/ 3125], loss: 0.308, per_step_time: 1426ms, lr: 9.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:12,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.60756 samples/s/p 3:13:48 } +2024-07-30 02:55:15,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1226/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.736417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:15,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66020 samples/s/p 3:11:57 } +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1228/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 9.7353095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:18,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66064 samples/s/p 3:11:53 } +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1230/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.734199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:21,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.66044 samples/s/p 3:11:51 } +2024-07-30 02:55:23,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1232/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 9.733087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:23,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.65875 samples/s/p 3:11:52 } +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1234/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 9.731971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:26,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65546 samples/s/p 3:11:55 } +2024-07-30 02:55:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1236/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.730855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:29,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.65913 samples/s/p 3:11:45 } +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1238/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.729735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:32,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66029 samples/s/p 3:11:40 } +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1240/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.728614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:35,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66061 samples/s/p 3:11:36 } +2024-07-30 02:55:38,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1242/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 9.727489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:38,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.66021 samples/s/p 3:11:34 } +2024-07-30 02:55:40,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1244/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 9.726363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:40,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66180 samples/s/p 3:11:28 } +2024-07-30 02:55:43,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1246/ 3125], loss: 0.466, per_step_time: 1414ms, lr: 9.725235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65531 samples/s/p 3:11:39 } +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1248/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 9.7241045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:46,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.66106 samples/s/p 3:11:24 } +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1250/ 3125], loss: 0.301, per_step_time: 1415ms, lr: 9.722971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:49,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.65170 samples/s/p 3:11:40 } +2024-07-30 02:55:52,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1252/ 3125], loss: 0.246, per_step_time: 1415ms, lr: 9.721835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:52,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65238 samples/s/p 3:11:36 } +2024-07-30 02:55:55,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1254/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 9.7206985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:55,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.65539 samples/s/p 3:11:27 } +2024-07-30 02:55:57,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1256/ 3125], loss: 0.186, per_step_time: 1412ms, lr: 9.719559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:55:57,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66311 samples/s/p 3:11:09 } +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1258/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 9.718417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:00,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66031 samples/s/p 3:11:12 } +2024-07-30 02:56:03,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1260/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.717272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:03,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.66061 samples/s/p 3:11:08 } +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1262/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 9.716126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:06,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66006 samples/s/p 3:11:07 } +2024-07-30 02:56:09,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1264/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.714978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:09,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66085 samples/s/p 3:11:02 } +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1266/ 3125], loss: 0.501, per_step_time: 1413ms, lr: 9.713827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.66167 samples/s/p 3:10:58 } +2024-07-30 02:56:14,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1268/ 3125], loss: 0.166, per_step_time: 1417ms, lr: 9.712674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:14,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.64258 samples/s/p 3:11:34 } +2024-07-30 02:56:17,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1270/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.711518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:17,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.65938 samples/s/p 3:10:57 } +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1272/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.71036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:20,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65945 samples/s/p 3:10:54 } +2024-07-30 02:56:23,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1274/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 9.709201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:23,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65767 samples/s/p 3:10:54 } +2024-07-30 02:56:26,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1276/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 9.708038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:26,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65974 samples/s/p 3:10:47 } +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1278/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 9.706873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:29,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.65726 samples/s/p 3:10:50 } +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1280/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 9.705706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65745 samples/s/p 3:10:46 } +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1282/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 9.704539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:34,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.65141 samples/s/p 3:10:56 } +2024-07-30 02:56:37,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1284/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.703367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:37,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66073 samples/s/p 3:10:34 } +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1286/ 3125], loss: 0.480, per_step_time: 1416ms, lr: 9.702194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:40,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.64838 samples/s/p 3:10:56 } +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1288/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 9.701018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:43,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.66139 samples/s/p 3:10:27 } +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1290/ 3125], loss: 0.396, per_step_time: 1412ms, lr: 9.69984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66200 samples/s/p 3:10:23 } +2024-07-30 02:56:48,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1292/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.6986605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66080 samples/s/p 3:10:23 } +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1294/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.697477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:51,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65826 samples/s/p 3:10:25 } +2024-07-30 02:56:54,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1296/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 9.696292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.65824 samples/s/p 3:10:22 } +2024-07-30 02:56:57,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1298/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 9.695105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:56:57,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.66100 samples/s/p 3:10:14 } +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1300/ 3125], loss: 0.553, per_step_time: 1418ms, lr: 9.693917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.64038 samples/s/p 3:10:53 } +2024-07-30 02:57:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1302/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.692725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:03,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66082 samples/s/p 3:10:08 } +2024-07-30 02:57:05,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1304/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.691531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:05,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66166 samples/s/p 3:10:04 } +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1306/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 9.690336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:08,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.66086 samples/s/p 3:10:03 } +2024-07-30 02:57:11,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1308/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.689138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:11,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.65785 samples/s/p 3:10:06 } +2024-07-30 02:57:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1310/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.687938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:14,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66004 samples/s/p 3:09:59 } +2024-07-30 02:57:17,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1312/ 3125], loss: 0.122, per_step_time: 1412ms, lr: 9.686734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:17,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.66275 samples/s/p 3:09:50 } +2024-07-30 02:57:20,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1314/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.685529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65827 samples/s/p 3:09:57 } +2024-07-30 02:57:22,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1316/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.684323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:22,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.65541 samples/s/p 3:10:00 } +2024-07-30 02:57:25,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1318/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 9.683114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:25,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66181 samples/s/p 3:09:44 } +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1320/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 9.681902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:28,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65922 samples/s/p 3:09:46 } +2024-07-30 02:57:31,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1322/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.680688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:31,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65866 samples/s/p 3:09:45 } +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1324/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 9.679472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:34,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.66270 samples/s/p 3:09:34 } +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1326/ 3125], loss: 0.458, per_step_time: 1413ms, lr: 9.678254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:37,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.65951 samples/s/p 3:09:37 } +2024-07-30 02:57:40,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1328/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 9.677034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:40,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65813 samples/s/p 3:09:37 } +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1330/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 9.67581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:42,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65859 samples/s/p 3:09:33 } +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1332/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.674586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:45,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.66117 samples/s/p 3:09:25 } +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1334/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.673359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:48,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.65785 samples/s/p 3:09:29 } +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1336/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.67213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:51,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65613 samples/s/p 3:09:30 } +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1338/ 3125], loss: 0.599, per_step_time: 1413ms, lr: 9.670897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:54,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66076 samples/s/p 3:09:18 } +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1340/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 9.669664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:57,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65384 samples/s/p 3:09:29 } +2024-07-30 02:57:59,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1342/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 9.668427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:57:59,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.66071 samples/s/p 3:09:12 } +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1344/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.667189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:02,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.65801 samples/s/p 3:09:15 } +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1346/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.665949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66234 samples/s/p 3:09:03 } +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1348/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.664705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66135 samples/s/p 3:09:02 } +2024-07-30 02:58:11,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1350/ 3125], loss: 0.249, per_step_time: 1412ms, lr: 9.663461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:11,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66458 samples/s/p 3:08:53 } +2024-07-30 02:58:14,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1352/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.662214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:14,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.65951 samples/s/p 3:09:00 } +2024-07-30 02:58:16,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1354/ 3125], loss: 0.305, per_step_time: 1412ms, lr: 9.660965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:16,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.66265 samples/s/p 3:08:51 } +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1356/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 9.659713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:19,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65730 samples/s/p 3:08:59 } +2024-07-30 02:58:22,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1358/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 9.658459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:22,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66106 samples/s/p 3:08:49 } +2024-07-30 02:58:25,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1360/ 3125], loss: 0.098, per_step_time: 1425ms, lr: 9.657203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:25,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.61353 samples/s/p 3:10:22 } +2024-07-30 02:58:28,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1362/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 9.655945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:28,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.65990 samples/s/p 3:08:45 } +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1364/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 9.654684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:31,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.66052 samples/s/p 3:08:41 } +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1366/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 9.65342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65797 samples/s/p 3:08:44 } +2024-07-30 02:58:36,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1368/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 9.652156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:36,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66153 samples/s/p 3:08:34 } +2024-07-30 02:58:39,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1370/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 9.650888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:39,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.65976 samples/s/p 3:08:34 } +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1372/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.64962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.66114 samples/s/p 3:08:29 } +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1374/ 3125], loss: 0.228, per_step_time: 1412ms, lr: 9.648348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:45,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66178 samples/s/p 3:08:25 } +2024-07-30 02:58:48,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1376/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.647073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:48,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66048 samples/s/p 3:08:25 } +2024-07-30 02:58:50,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1378/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 9.645798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:50,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65853 samples/s/p 3:08:26 } +2024-07-30 02:58:53,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1380/ 3125], loss: 0.612, per_step_time: 1413ms, lr: 9.64452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:53,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.66067 samples/s/p 3:08:19 } +2024-07-30 02:58:56,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1382/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 9.643239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:56,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.65814 samples/s/p 3:08:21 } +2024-07-30 02:58:59,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1384/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.641956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:58:59,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65969 samples/s/p 3:08:15 } +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1386/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 9.640671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:02,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65222 samples/s/p 3:08:27 } +2024-07-30 02:59:05,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1388/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.639384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:05,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65725 samples/s/p 3:08:14 } +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1390/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 9.6380945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:07,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.66198 samples/s/p 3:08:02 } +2024-07-30 02:59:10,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1392/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 9.636802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:10,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.65394 samples/s/p 3:08:15 } +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1394/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 9.635509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:13,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65655 samples/s/p 3:08:07 } +2024-07-30 02:59:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1396/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.634213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66127 samples/s/p 3:07:55 } +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1398/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 9.632915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:19,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.66034 samples/s/p 3:07:54 } +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1400/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.6316135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.65751 samples/s/p 3:07:57 } +2024-07-30 02:59:22,059 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 02:59:56,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1402/ 3125], loss: 0.537, per_step_time: 1824ms, lr: 9.630311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:56,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 4.38374 samples/s/p 4:02:30 } +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1404/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.629006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 02:59:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65681 samples/s/p 3:07:52 } +2024-07-30 03:00:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1406/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 9.6277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:02,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65837 samples/s/p 3:07:46 } +2024-07-30 03:00:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1408/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.62639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:05,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.66022 samples/s/p 3:07:40 } +2024-07-30 03:00:08,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1410/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 9.625078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:08,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.65895 samples/s/p 3:07:40 } +2024-07-30 03:00:11,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1412/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 9.6237645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:11,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65180 samples/s/p 3:07:51 } +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1414/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 9.6224485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:14,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.65630 samples/s/p 3:07:39 } +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1416/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.621131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66051 samples/s/p 3:07:28 } +2024-07-30 03:00:19,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1418/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 9.61981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:19,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66203 samples/s/p 3:07:22 } +2024-07-30 03:00:22,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1420/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.618488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:22,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.66134 samples/s/p 3:07:21 } +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1422/ 3125], loss: 0.702, per_step_time: 1413ms, lr: 9.617163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:25,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66071 samples/s/p 3:07:19 } +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1424/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 9.615836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:28,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65987 samples/s/p 3:07:18 } +2024-07-30 03:00:31,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1426/ 3125], loss: 0.307, per_step_time: 1414ms, lr: 9.614508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:31,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.65640 samples/s/p 3:07:22 } +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1428/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 9.613175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:34,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.66084 samples/s/p 3:07:10 } +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1430/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 9.611842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:36,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66170 samples/s/p 3:07:06 } +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1432/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.610506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:39,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.65981 samples/s/p 3:07:07 } +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1434/ 3125], loss: 0.264, per_step_time: 1416ms, lr: 9.609167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:42,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.64874 samples/s/p 3:07:26 } +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1436/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 9.607828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:45,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66035 samples/s/p 3:07:00 } +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1438/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.606485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:48,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.66086 samples/s/p 3:06:56 } +2024-07-30 03:00:51,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1440/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 9.605141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:51,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66274 samples/s/p 3:06:50 } +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1442/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 9.603795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.66046 samples/s/p 3:06:51 } +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1444/ 3125], loss: 0.148, per_step_time: 1417ms, lr: 9.602445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:56,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64350 samples/s/p 3:07:22 } +2024-07-30 03:00:59,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1446/ 3125], loss: 0.254, per_step_time: 1416ms, lr: 9.601094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:00:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64654 samples/s/p 3:07:13 } +2024-07-30 03:01:02,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1448/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 9.599741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:02,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.64895 samples/s/p 3:07:06 } +2024-07-30 03:01:05,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1450/ 3125], loss: 0.306, per_step_time: 1419ms, lr: 9.598385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:05,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63406 samples/s/p 3:07:32 } +2024-07-30 03:01:08,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1452/ 3125], loss: 0.187, per_step_time: 1421ms, lr: 9.597027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:08,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.62822 samples/s/p 3:07:41 } +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1454/ 3125], loss: 0.147, per_step_time: 1419ms, lr: 9.595667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.63652 samples/s/p 3:07:22 } +2024-07-30 03:01:13,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1456/ 3125], loss: 0.250, per_step_time: 1427ms, lr: 9.594305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:13,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.60566 samples/s/p 3:08:21 } +2024-07-30 03:01:16,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1458/ 3125], loss: 0.402, per_step_time: 1418ms, lr: 9.592941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:16,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.63892 samples/s/p 3:07:11 } +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1460/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.591575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:19,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65886 samples/s/p 3:06:29 } +2024-07-30 03:01:22,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1462/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.590206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:22,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65839 samples/s/p 3:06:27 } +2024-07-30 03:01:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1464/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.588835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:25,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.65800 samples/s/p 3:06:25 } +2024-07-30 03:01:28,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1466/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 9.587462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:28,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.66012 samples/s/p 3:06:18 } +2024-07-30 03:01:30,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1468/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 9.586086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:30,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65770 samples/s/p 3:06:20 } +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1470/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 9.584708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:33,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65529 samples/s/p 3:06:22 } +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1472/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.583328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:36,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.65932 samples/s/p 3:06:11 } +2024-07-30 03:01:39,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1474/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.581947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.66063 samples/s/p 3:06:06 } +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1476/ 3125], loss: 0.335, per_step_time: 1416ms, lr: 9.580563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:42,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.64802 samples/s/p 3:06:28 } +2024-07-30 03:01:45,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1478/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.579177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:45,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65945 samples/s/p 3:06:02 } +2024-07-30 03:01:47,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1480/ 3125], loss: 0.177, per_step_time: 1418ms, lr: 9.577788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:47,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.63800 samples/s/p 3:06:42 } +2024-07-30 03:01:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1482/ 3125], loss: 0.156, per_step_time: 1421ms, lr: 9.576398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:50,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.62870 samples/s/p 3:06:58 } +2024-07-30 03:01:53,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1484/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 9.575005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.65563 samples/s/p 3:06:01 } +2024-07-30 03:01:56,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1486/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.5736095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:56,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65429 samples/s/p 3:06:01 } +2024-07-30 03:01:59,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1488/ 3125], loss: 0.203, per_step_time: 1416ms, lr: 9.572213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:01:59,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.64727 samples/s/p 3:06:12 } +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1490/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 9.570813e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:02,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66246 samples/s/p 3:05:40 } +2024-07-30 03:02:04,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1492/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.569411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:04,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.65822 samples/s/p 3:05:45 } +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1494/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 9.568008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.66134 samples/s/p 3:05:36 } +2024-07-30 03:02:10,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1496/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 9.566602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:10,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65828 samples/s/p 3:05:39 } +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1498/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 9.565194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:13,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.65631 samples/s/p 3:05:40 } +2024-07-30 03:02:16,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1500/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 9.563783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:16,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65923 samples/s/p 3:05:32 } +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1502/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.562372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:19,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65989 samples/s/p 3:05:28 } +2024-07-30 03:02:21,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1504/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.560956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:21,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.65919 samples/s/p 3:05:26 } +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1506/ 3125], loss: 0.245, per_step_time: 1412ms, lr: 9.55954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:24,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66178 samples/s/p 3:05:18 } +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1508/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 9.558121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:27,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65647 samples/s/p 3:05:26 } +2024-07-30 03:02:30,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1510/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 9.556699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:30,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.64849 samples/s/p 3:05:39 } +2024-07-30 03:02:33,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1512/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 9.555276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:33,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.65772 samples/s/p 3:05:18 } +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1514/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 9.553851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:36,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.66009 samples/s/p 3:05:10 } +2024-07-30 03:02:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1516/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 9.552423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:38,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.66129 samples/s/p 3:05:05 } +2024-07-30 03:02:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1518/ 3125], loss: 0.398, per_step_time: 1415ms, lr: 9.550993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65256 samples/s/p 3:05:19 } +2024-07-30 03:02:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1520/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 9.549562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:44,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.66213 samples/s/p 3:04:58 } +2024-07-30 03:02:47,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1522/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.548126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:47,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.65956 samples/s/p 3:05:00 } +2024-07-30 03:02:50,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1524/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 9.54669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:50,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.66011 samples/s/p 3:04:56 } +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1526/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 9.545252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65245 samples/s/p 3:05:08 } +2024-07-30 03:02:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1528/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 9.543812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65813 samples/s/p 3:04:54 } +2024-07-30 03:02:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1530/ 3125], loss: 0.642, per_step_time: 1413ms, lr: 9.542368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:02:58,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65960 samples/s/p 3:04:49 } +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1532/ 3125], loss: 0.652, per_step_time: 1414ms, lr: 9.540923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:01,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.65595 samples/s/p 3:04:53 } +2024-07-30 03:03:04,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1534/ 3125], loss: 0.135, per_step_time: 1414ms, lr: 9.539476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:04,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65477 samples/s/p 3:04:52 } +2024-07-30 03:03:07,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1536/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.5380265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:07,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65931 samples/s/p 3:04:41 } +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1538/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 9.536576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:10,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66068 samples/s/p 3:04:35 } +2024-07-30 03:03:12,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1540/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 9.5351215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:12,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.66029 samples/s/p 3:04:33 } +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1542/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 9.533665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.65954 samples/s/p 3:04:32 } +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1544/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.532207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:18,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66073 samples/s/p 3:04:27 } +2024-07-30 03:03:21,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1546/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.530747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:21,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66100 samples/s/p 3:04:23 } +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1548/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.529285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:24,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66024 samples/s/p 3:04:22 } +2024-07-30 03:03:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1550/ 3125], loss: 0.290, per_step_time: 1412ms, lr: 9.52782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:27,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.66289 samples/s/p 3:04:14 } +2024-07-30 03:03:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1552/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 9.526354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:29,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65979 samples/s/p 3:04:17 } +2024-07-30 03:03:32,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1554/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 9.524885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:32,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.65491 samples/s/p 3:04:24 } +2024-07-30 03:03:35,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1556/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 9.5234145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:35,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66204 samples/s/p 3:04:07 } +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1558/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.52194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:38,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66063 samples/s/p 3:04:07 } +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1560/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 9.520465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:41,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.66199 samples/s/p 3:04:02 } +2024-07-30 03:03:44,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1562/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.518988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:44,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.66084 samples/s/p 3:04:01 } +2024-07-30 03:03:46,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1564/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 9.517508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:46,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65673 samples/s/p 3:04:06 } +2024-07-30 03:03:49,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1566/ 3125], loss: 0.421, per_step_time: 1414ms, lr: 9.516027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:49,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65662 samples/s/p 3:04:04 } +2024-07-30 03:03:52,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1568/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 9.514542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:52,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65864 samples/s/p 3:03:57 } +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1570/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.513056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.65837 samples/s/p 3:03:54 } +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1572/ 3125], loss: 0.147, per_step_time: 1414ms, lr: 9.511568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:03:58,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65448 samples/s/p 3:03:59 } +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1574/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 9.510079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:01,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65875 samples/s/p 3:03:48 } +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1576/ 3125], loss: 0.207, per_step_time: 1425ms, lr: 9.508584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.61177 samples/s/p 3:05:18 } +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1578/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.50709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.65968 samples/s/p 3:03:41 } +2024-07-30 03:04:09,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1580/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.505594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:09,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65744 samples/s/p 3:03:42 } +2024-07-30 03:04:12,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1582/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.504094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:12,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.66070 samples/s/p 3:03:33 } +2024-07-30 03:04:15,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1584/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 9.5025935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:15,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65624 samples/s/p 3:03:39 } +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1586/ 3125], loss: 0.383, per_step_time: 1416ms, lr: 9.50109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:18,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.64845 samples/s/p 3:03:51 } +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1588/ 3125], loss: 0.414, per_step_time: 1414ms, lr: 9.499584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:21,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.65738 samples/s/p 3:03:31 } +2024-07-30 03:04:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1590/ 3125], loss: 0.183, per_step_time: 1414ms, lr: 9.498076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:23,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65524 samples/s/p 3:03:32 } +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1592/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 9.496567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65975 samples/s/p 3:03:21 } +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1594/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 9.495055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:29,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65395 samples/s/p 3:03:29 } +2024-07-30 03:04:32,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1596/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 9.49354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:32,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.66016 samples/s/p 3:03:14 } +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1598/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 9.492024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:35,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.65445 samples/s/p 3:03:23 } +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1600/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 9.490506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:38,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65567 samples/s/p 3:03:17 } +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1602/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 9.488986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66039 samples/s/p 3:03:05 } +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1604/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 9.487463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:43,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.66333 samples/s/p 3:02:57 } +2024-07-30 03:04:46,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1606/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 9.485938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.65983 samples/s/p 3:03:01 } +2024-07-30 03:04:49,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1608/ 3125], loss: 0.170, per_step_time: 1414ms, lr: 9.484411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:49,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65650 samples/s/p 3:03:04 } +2024-07-30 03:04:52,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1610/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 9.482882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:52,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65848 samples/s/p 3:02:58 } +2024-07-30 03:04:55,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1612/ 3125], loss: 0.373, per_step_time: 1414ms, lr: 9.48135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:55,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65746 samples/s/p 3:02:57 } +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1614/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.479818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:04:57,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.66157 samples/s/p 3:02:46 } +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1616/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 9.478282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:00,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.65916 samples/s/p 3:02:48 } +2024-07-30 03:05:03,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1618/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 9.476745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:03,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66022 samples/s/p 3:02:43 } +2024-07-30 03:05:06,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1620/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.475205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:06,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66158 samples/s/p 3:02:38 } +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1622/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 9.473662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:09,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66031 samples/s/p 3:02:37 } +2024-07-30 03:05:12,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1624/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 9.472118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:12,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66140 samples/s/p 3:02:32 } +2024-07-30 03:05:14,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1626/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 9.470572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:14,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.66150 samples/s/p 3:02:29 } +2024-07-30 03:05:17,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1628/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.469024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:17,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66091 samples/s/p 3:02:28 } +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1630/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.467472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:20,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66168 samples/s/p 3:02:23 } +2024-07-30 03:05:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1632/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 9.465921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:23,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.66333 samples/s/p 3:02:17 } +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1634/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.4643665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.65827 samples/s/p 3:02:24 } +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1636/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 9.4628085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:29,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66121 samples/s/p 3:02:16 } +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1638/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 9.46125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:31,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.66166 samples/s/p 3:02:12 } +2024-07-30 03:05:34,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1640/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 9.459689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:34,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65986 samples/s/p 3:02:13 } +2024-07-30 03:05:37,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1642/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.4581255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:37,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65847 samples/s/p 3:02:12 } +2024-07-30 03:05:40,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1644/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 9.45656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:40,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.65252 samples/s/p 3:02:21 } +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1646/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 9.454992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:43,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65593 samples/s/p 3:02:12 } +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1648/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 9.453423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:46,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65837 samples/s/p 3:02:04 } +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1650/ 3125], loss: 0.204, per_step_time: 1415ms, lr: 9.451852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:48,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65351 samples/s/p 3:02:11 } +2024-07-30 03:05:51,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1652/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 9.450278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:51,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.65873 samples/s/p 3:01:58 } +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1654/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 9.448701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:54,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.66180 samples/s/p 3:01:49 } +2024-07-30 03:05:57,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1656/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 9.447123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:05:57,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66102 samples/s/p 3:01:48 } +2024-07-30 03:06:00,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1658/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.445543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:00,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65939 samples/s/p 3:01:48 } +2024-07-30 03:06:03,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1660/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.443961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:03,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66141 samples/s/p 3:01:41 } +2024-07-30 03:06:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1662/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.442376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.66100 samples/s/p 3:01:39 } +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1664/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.44079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:08,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.65880 samples/s/p 3:01:41 } +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1666/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 9.439201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:11,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66365 samples/s/p 3:01:29 } +2024-07-30 03:06:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1668/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.43761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:14,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65940 samples/s/p 3:01:34 } +2024-07-30 03:06:17,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1670/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.436017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:17,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.66096 samples/s/p 3:01:28 } +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1672/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 9.434422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:20,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.65621 samples/s/p 3:01:34 } +2024-07-30 03:06:22,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1674/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 9.432824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65895 samples/s/p 3:01:26 } +2024-07-30 03:06:25,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1676/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 9.431225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.66204 samples/s/p 3:01:18 } +2024-07-30 03:06:28,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1678/ 3125], loss: 0.519, per_step_time: 1413ms, lr: 9.429624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:28,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65962 samples/s/p 3:01:19 } +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1680/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 9.42802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65760 samples/s/p 3:01:20 } +2024-07-30 03:06:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1682/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 9.426415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.65666 samples/s/p 3:01:19 } +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1684/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 9.424806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:37,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.65851 samples/s/p 3:01:13 } +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1686/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 9.423197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.66164 samples/s/p 3:01:04 } +2024-07-30 03:06:42,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1688/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 9.421586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66007 samples/s/p 3:01:04 } +2024-07-30 03:06:45,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1690/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.419971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:45,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.65991 samples/s/p 3:01:02 } +2024-07-30 03:06:48,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1692/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 9.418355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:48,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.66107 samples/s/p 3:00:57 } +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1694/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.416737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:51,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66029 samples/s/p 3:00:55 } +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1696/ 3125], loss: 0.180, per_step_time: 1412ms, lr: 9.415116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.66229 samples/s/p 3:00:49 } +2024-07-30 03:06:56,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1698/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 9.413494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:56,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65862 samples/s/p 3:00:53 } +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1700/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 9.411869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:06:59,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.65688 samples/s/p 3:00:54 } +2024-07-30 03:07:02,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1702/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 9.410242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:02,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66049 samples/s/p 3:00:44 } +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1704/ 3125], loss: 0.429, per_step_time: 1414ms, lr: 9.408614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:05,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65645 samples/s/p 3:00:49 } +2024-07-30 03:07:08,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1706/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.406983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:08,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66087 samples/s/p 3:00:37 } +2024-07-30 03:07:11,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1708/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 9.4053485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:11,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.65864 samples/s/p 3:00:39 } +2024-07-30 03:07:13,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1710/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 9.403714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:13,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.66050 samples/s/p 3:00:32 } +2024-07-30 03:07:16,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1712/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.402076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:16,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66116 samples/s/p 3:00:28 } +2024-07-30 03:07:19,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1714/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 9.400437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:19,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65984 samples/s/p 3:00:28 } +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1716/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 9.398796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:22,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.66207 samples/s/p 3:00:21 } +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1718/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.397152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:25,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65995 samples/s/p 3:00:22 } +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1720/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 9.395506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:28,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.65814 samples/s/p 3:00:23 } +2024-07-30 03:07:30,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1722/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 9.393859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:30,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65481 samples/s/p 3:00:26 } +2024-07-30 03:07:33,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1724/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 9.392209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:33,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65580 samples/s/p 3:00:22 } +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1726/ 3125], loss: 0.149, per_step_time: 1417ms, lr: 9.390556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.64405 samples/s/p 3:00:41 } +2024-07-30 03:07:39,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1728/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 9.388902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.65694 samples/s/p 3:00:14 } +2024-07-30 03:07:42,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1730/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 9.387246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:42,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66107 samples/s/p 3:00:03 } +2024-07-30 03:07:45,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1732/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.385587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:45,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65652 samples/s/p 3:00:09 } +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1734/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 9.383927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65565 samples/s/p 3:00:08 } +2024-07-30 03:07:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1736/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 9.382265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.66083 samples/s/p 2:59:55 } +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1738/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 9.380601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:53,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.65806 samples/s/p 2:59:58 } +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1740/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 9.378934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:56,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65985 samples/s/p 2:59:51 } +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1742/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 9.377265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:07:59,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65395 samples/s/p 3:00:00 } +2024-07-30 03:08:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1744/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.375594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:02,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66311 samples/s/p 2:59:39 } +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1746/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 9.373922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.66223 samples/s/p 2:59:38 } +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1748/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 9.3722465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:07,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.65658 samples/s/p 2:59:46 } +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1750/ 3125], loss: 0.379, per_step_time: 1412ms, lr: 9.3705685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:10,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66183 samples/s/p 2:59:33 } +2024-07-30 03:08:13,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1752/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.3688905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:13,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66111 samples/s/p 2:59:32 } +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1754/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.367209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:16,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.66057 samples/s/p 2:59:30 } +2024-07-30 03:08:19,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1756/ 3125], loss: 0.423, per_step_time: 1413ms, lr: 9.365525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:19,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.65840 samples/s/p 2:59:31 } +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1758/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.363841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:21,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66035 samples/s/p 2:59:25 } +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1760/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 9.362153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:24,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.66092 samples/s/p 2:59:21 } +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1762/ 3125], loss: 0.590, per_step_time: 1413ms, lr: 9.360463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65986 samples/s/p 2:59:20 } +2024-07-30 03:08:30,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1764/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.358771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:30,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65875 samples/s/p 2:59:19 } +2024-07-30 03:08:33,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1766/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 9.357077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:33,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.65819 samples/s/p 2:59:18 } +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1768/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.355382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66161 samples/s/p 2:59:08 } +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1770/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.353684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:38,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66126 samples/s/p 2:59:06 } +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1772/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 9.351984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:41,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66182 samples/s/p 2:59:02 } +2024-07-30 03:08:44,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1774/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 9.350281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:44,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.65924 samples/s/p 2:59:04 } +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1776/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 9.348578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:47,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.66316 samples/s/p 2:58:54 } +2024-07-30 03:08:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1778/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 9.346872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:50,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66041 samples/s/p 2:58:57 } +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1780/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 9.345163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.66295 samples/s/p 2:58:49 } +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1782/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 9.343452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65964 samples/s/p 2:58:52 } +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1784/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 9.341739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:08:58,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.65933 samples/s/p 2:58:50 } +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1786/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 9.340025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:01,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65634 samples/s/p 2:58:53 } +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1788/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.338309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:04,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65888 samples/s/p 2:58:45 } +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1790/ 3125], loss: 0.432, per_step_time: 1413ms, lr: 9.33659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:07,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65889 samples/s/p 2:58:42 } +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1792/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 9.334869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:10,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65785 samples/s/p 2:58:42 } +2024-07-30 03:09:12,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1794/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 9.333146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:12,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.65814 samples/s/p 2:58:38 } +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1796/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 9.331422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65690 samples/s/p 2:58:38 } +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1798/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 9.329694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:18,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65824 samples/s/p 2:58:32 } +2024-07-30 03:09:21,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1800/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.327966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:21,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65883 samples/s/p 2:58:28 } +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1802/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 9.326234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:24,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.65575 samples/s/p 2:58:31 } +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1804/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 9.324502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.66130 samples/s/p 2:58:18 } +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1806/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 9.322765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:29,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65925 samples/s/p 2:58:19 } +2024-07-30 03:09:32,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1808/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 9.321029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:32,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65859 samples/s/p 2:58:18 } +2024-07-30 03:09:35,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1810/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 9.319289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:35,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65980 samples/s/p 2:58:12 } +2024-07-30 03:09:38,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1812/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.317549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:38,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65960 samples/s/p 2:58:10 } +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1814/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.315804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:41,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.65999 samples/s/p 2:58:06 } +2024-07-30 03:09:44,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1816/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.314059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:44,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66071 samples/s/p 2:58:02 } +2024-07-30 03:09:46,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1818/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.312312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:46,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.65785 samples/s/p 2:58:05 } +2024-07-30 03:09:49,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1820/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 9.310561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:49,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66163 samples/s/p 2:57:55 } +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1822/ 3125], loss: 0.357, per_step_time: 1412ms, lr: 9.30881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.66199 samples/s/p 2:57:51 } +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1824/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 9.307057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:55,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66088 samples/s/p 2:57:51 } +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1826/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 9.3053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:09:58,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65929 samples/s/p 2:57:51 } +2024-07-30 03:10:01,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1828/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 9.303542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:01,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.66115 samples/s/p 2:57:44 } +2024-07-30 03:10:03,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1830/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 9.3017825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:03,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65938 samples/s/p 2:57:45 } +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1832/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 9.300021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.65582 samples/s/p 2:57:49 } +2024-07-30 03:10:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1834/ 3125], loss: 0.279, per_step_time: 1414ms, lr: 9.298256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:09,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.65606 samples/s/p 2:57:46 } +2024-07-30 03:10:12,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1836/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.296491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:12,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66174 samples/s/p 2:57:32 } +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1838/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.294722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:15,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66114 samples/s/p 2:57:30 } +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1840/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 9.292952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:18,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66177 samples/s/p 2:57:26 } +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1842/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 9.2911805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:20,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.66016 samples/s/p 2:57:27 } +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1844/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 9.289406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:23,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66114 samples/s/p 2:57:22 } +2024-07-30 03:10:26,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1846/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 9.28763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:26,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65874 samples/s/p 2:57:24 } +2024-07-30 03:10:29,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1848/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.285851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:29,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.66039 samples/s/p 2:57:18 } +2024-07-30 03:10:32,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1850/ 3125], loss: 0.507, per_step_time: 1413ms, lr: 9.28407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:32,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.65900 samples/s/p 2:57:17 } +2024-07-30 03:10:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1852/ 3125], loss: 0.280, per_step_time: 1414ms, lr: 9.282288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:35,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65624 samples/s/p 2:57:20 } +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1854/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 9.280503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:37,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65813 samples/s/p 2:57:13 } +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1856/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 9.278717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:40,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66086 samples/s/p 2:57:05 } +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1858/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 9.276928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:43,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.65834 samples/s/p 2:57:07 } +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1860/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 9.275138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.66086 samples/s/p 2:57:00 } +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1862/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.273345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:49,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66137 samples/s/p 2:56:56 } +2024-07-30 03:10:52,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1864/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.271551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:52,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66055 samples/s/p 2:56:55 } +2024-07-30 03:10:54,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1866/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 9.269754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:54,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66024 samples/s/p 2:56:52 } +2024-07-30 03:10:57,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1868/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 9.267955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:10:57,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.65554 samples/s/p 2:56:58 } +2024-07-30 03:11:00,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1870/ 3125], loss: 0.165, per_step_time: 1412ms, lr: 9.266154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:00,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.66180 samples/s/p 2:56:44 } +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1872/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.264351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:03,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65876 samples/s/p 2:56:47 } +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1874/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 9.262546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:06,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.65545 samples/s/p 2:56:50 } +2024-07-30 03:11:09,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1876/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 9.260739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:09,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65882 samples/s/p 2:56:41 } +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1878/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 9.258931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:11,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.65470 samples/s/p 2:56:46 } +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1880/ 3125], loss: 0.310, per_step_time: 1412ms, lr: 9.257119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:14,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.66208 samples/s/p 2:56:29 } +2024-07-30 03:11:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1882/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 9.255306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:17,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65843 samples/s/p 2:56:33 } +2024-07-30 03:11:20,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1884/ 3125], loss: 0.320, per_step_time: 1416ms, lr: 9.253491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:20,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.64743 samples/s/p 2:56:51 } +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1886/ 3125], loss: 0.366, per_step_time: 1424ms, lr: 9.251674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.61424 samples/s/p 2:57:51 } +2024-07-30 03:11:26,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1888/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 9.249855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:26,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.65677 samples/s/p 2:56:28 } +2024-07-30 03:11:29,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1890/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 9.248033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66161 samples/s/p 2:56:16 } +2024-07-30 03:11:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1892/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 9.24621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:31,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66042 samples/s/p 2:56:15 } +2024-07-30 03:11:34,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1894/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.244384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66054 samples/s/p 2:56:12 } +2024-07-30 03:11:37,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1896/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 9.242558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:37,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.66002 samples/s/p 2:56:10 } +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1898/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.240728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:40,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.65799 samples/s/p 2:56:11 } +2024-07-30 03:11:43,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1900/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.238896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66140 samples/s/p 2:56:02 } +2024-07-30 03:11:46,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1902/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.237063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:46,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65936 samples/s/p 2:56:03 } +2024-07-30 03:11:48,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1904/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 9.235228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:48,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.65956 samples/s/p 2:56:00 } +2024-07-30 03:11:51,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1906/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 9.233391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.66239 samples/s/p 2:55:52 } +2024-07-30 03:11:54,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1908/ 3125], loss: 0.155, per_step_time: 1412ms, lr: 9.231551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:54,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66184 samples/s/p 2:55:50 } +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1910/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 9.22971e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:11:57,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66009 samples/s/p 2:55:51 } +2024-07-30 03:12:00,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1912/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 9.227867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:00,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66103 samples/s/p 2:55:46 } +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1914/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.226022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.65987 samples/s/p 2:55:45 } +2024-07-30 03:12:05,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1916/ 3125], loss: 0.279, per_step_time: 1412ms, lr: 9.2241735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:05,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.66261 samples/s/p 2:55:37 } +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1918/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 9.222324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:08,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66003 samples/s/p 2:55:39 } +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1920/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 9.220473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:11,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66161 samples/s/p 2:55:34 } +2024-07-30 03:12:14,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1922/ 3125], loss: 0.172, per_step_time: 1414ms, lr: 9.218618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:14,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.65765 samples/s/p 2:55:38 } +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1924/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 9.216764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:17,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66152 samples/s/p 2:55:28 } +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1926/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 9.214905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:20,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.66071 samples/s/p 2:55:27 } +2024-07-30 03:12:22,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1928/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 9.213046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:22,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65889 samples/s/p 2:55:27 } +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1930/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 9.211185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:25,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.66081 samples/s/p 2:55:21 } +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1932/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 9.209321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:28,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65667 samples/s/p 2:55:26 } +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1934/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 9.207456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:31,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.65969 samples/s/p 2:55:17 } +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1936/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 9.205588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:34,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65906 samples/s/p 2:55:16 } +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1938/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.203719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:37,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66042 samples/s/p 2:55:10 } +2024-07-30 03:12:39,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1940/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 9.201847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:39,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65598 samples/s/p 2:55:16 } +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1942/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 9.199974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:42,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.65666 samples/s/p 2:55:12 } +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1944/ 3125], loss: 0.240, per_step_time: 1412ms, lr: 9.198097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:45,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.66202 samples/s/p 2:54:59 } +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1946/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 9.19622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:48,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65805 samples/s/p 2:55:03 } +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1948/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.19434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:51,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65919 samples/s/p 2:54:59 } +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1950/ 3125], loss: 0.079, per_step_time: 1413ms, lr: 9.192459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:54,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65868 samples/s/p 2:54:57 } +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1952/ 3125], loss: 0.346, per_step_time: 1414ms, lr: 9.190576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:56,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65628 samples/s/p 2:54:58 } +2024-07-30 03:12:59,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1954/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.18869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:12:59,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.65821 samples/s/p 2:54:52 } +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1956/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 9.186801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:02,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66026 samples/s/p 2:54:45 } +2024-07-30 03:13:05,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1958/ 3125], loss: 0.354, per_step_time: 1412ms, lr: 9.184912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:05,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66328 samples/s/p 2:54:37 } +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1960/ 3125], loss: 0.174, per_step_time: 1412ms, lr: 9.183021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:08,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66251 samples/s/p 2:54:35 } +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1962/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 9.181127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:11,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.65668 samples/s/p 2:54:43 } +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1964/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 9.179231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:13,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.66020 samples/s/p 2:54:34 } +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1966/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 9.1773345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:16,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66125 samples/s/p 2:54:29 } +2024-07-30 03:13:19,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1968/ 3125], loss: 0.075, per_step_time: 1413ms, lr: 9.175434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:19,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.65924 samples/s/p 2:54:30 } +2024-07-30 03:13:22,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1970/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.173533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:22,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66080 samples/s/p 2:54:24 } +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1972/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 9.171628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:25,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.66135 samples/s/p 2:54:21 } +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1974/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 9.169723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:28,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66083 samples/s/p 2:54:19 } +2024-07-30 03:13:30,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1976/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 9.167815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:30,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66096 samples/s/p 2:54:16 } +2024-07-30 03:13:33,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1978/ 3125], loss: 0.148, per_step_time: 1414ms, lr: 9.165906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:33,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65599 samples/s/p 2:54:22 } +2024-07-30 03:13:36,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1980/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 9.163994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:36,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.66104 samples/s/p 2:54:10 } +2024-07-30 03:13:39,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1982/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 9.1620805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:39,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.65778 samples/s/p 2:54:13 } +2024-07-30 03:13:42,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1984/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 9.160166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:42,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66195 samples/s/p 2:54:03 } +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1986/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 9.158248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66080 samples/s/p 2:54:02 } +2024-07-30 03:13:47,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1988/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 9.156328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:47,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66194 samples/s/p 2:53:57 } +2024-07-30 03:13:50,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1990/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 9.154406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:50,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66150 samples/s/p 2:53:55 } +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1992/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.1524835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:53,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.66087 samples/s/p 2:53:53 } +2024-07-30 03:13:56,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1994/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:56,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66029 samples/s/p 2:53:51 } +2024-07-30 03:13:59,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1996/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 9.14863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:13:59,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66178 samples/s/p 2:53:46 } +2024-07-30 03:14:02,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 1998/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 9.1467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:02,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66192 samples/s/p 2:53:43 } +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2000/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 9.144769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:04,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.66008 samples/s/p 2:53:43 } +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2002/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 9.1428365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:07,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65847 samples/s/p 2:53:44 } +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2004/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 9.140901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:10,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65995 samples/s/p 2:53:38 } +2024-07-30 03:14:13,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2006/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 9.138963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:13,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.66088 samples/s/p 2:53:33 } +2024-07-30 03:14:16,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2008/ 3125], loss: 0.285, per_step_time: 1415ms, lr: 9.137024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:16,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65320 samples/s/p 2:53:45 } +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2010/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 9.135083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.65983 samples/s/p 2:53:30 } +2024-07-30 03:14:21,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2012/ 3125], loss: 0.333, per_step_time: 1412ms, lr: 9.1331385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:21,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66208 samples/s/p 2:53:23 } +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2014/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 9.131193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:24,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65488 samples/s/p 2:53:33 } +2024-07-30 03:14:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2016/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 9.129246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:27,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65886 samples/s/p 2:53:23 } +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2018/ 3125], loss: 0.382, per_step_time: 1414ms, lr: 9.127297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:30,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.65589 samples/s/p 2:53:26 } +2024-07-30 03:14:33,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2020/ 3125], loss: 0.444, per_step_time: 1412ms, lr: 9.125346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:33,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.66270 samples/s/p 2:53:10 } +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2022/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.123393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:36,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65920 samples/s/p 2:53:14 } +2024-07-30 03:14:38,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2024/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 9.121438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:38,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65715 samples/s/p 2:53:15 } +2024-07-30 03:14:41,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2026/ 3125], loss: 0.168, per_step_time: 1414ms, lr: 9.119481e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:41,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65715 samples/s/p 2:53:12 } +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2028/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 9.117522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:44,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.65861 samples/s/p 2:53:06 } +2024-07-30 03:14:47,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2030/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 9.11556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:47,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66026 samples/s/p 2:53:01 } +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2032/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 9.113598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65855 samples/s/p 2:53:01 } +2024-07-30 03:14:53,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2034/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 9.1116335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65861 samples/s/p 2:52:58 } +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2036/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 9.109666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:55,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.66057 samples/s/p 2:52:52 } +2024-07-30 03:14:58,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2038/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 9.107697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:14:58,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.65105 samples/s/p 2:53:06 } +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2040/ 3125], loss: 0.238, per_step_time: 1412ms, lr: 9.105726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:01,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66287 samples/s/p 2:52:42 } +2024-07-30 03:15:04,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2042/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.103754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:04,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66067 samples/s/p 2:52:43 } +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2044/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 9.101778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:07,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.65982 samples/s/p 2:52:42 } +2024-07-30 03:15:10,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2046/ 3125], loss: 0.397, per_step_time: 1412ms, lr: 9.099802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:10,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66193 samples/s/p 2:52:35 } +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2048/ 3125], loss: 0.360, per_step_time: 1412ms, lr: 9.097823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:12,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.66181 samples/s/p 2:52:32 } +2024-07-30 03:15:15,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2050/ 3125], loss: 0.395, per_step_time: 1412ms, lr: 9.095843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:15,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66173 samples/s/p 2:52:30 } +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2052/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 9.09386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:18,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.65852 samples/s/p 2:52:33 } +2024-07-30 03:15:21,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2054/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 9.091876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:21,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66110 samples/s/p 2:52:25 } +2024-07-30 03:15:24,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2056/ 3125], loss: 0.190, per_step_time: 1412ms, lr: 9.089889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:24,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.66268 samples/s/p 2:52:19 } +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2058/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 9.0879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:27,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66061 samples/s/p 2:52:20 } +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2060/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 9.08591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:29,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.65916 samples/s/p 2:52:20 } +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2062/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 9.0839185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:32,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.66150 samples/s/p 2:52:13 } +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2064/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 9.081924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:35,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65584 samples/s/p 2:52:21 } +2024-07-30 03:15:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2066/ 3125], loss: 0.354, per_step_time: 1414ms, lr: 9.079927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:38,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.65767 samples/s/p 2:52:15 } +2024-07-30 03:15:41,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2068/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 9.0779295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:41,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65707 samples/s/p 2:52:13 } +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2070/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 9.0759295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:44,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66105 samples/s/p 2:52:03 } +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 9.073927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:46,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65974 samples/s/p 2:52:02 } +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2074/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 9.071923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.65365 samples/s/p 2:52:11 } +2024-07-30 03:15:52,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2076/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.069917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:52,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.66123 samples/s/p 2:51:54 } +2024-07-30 03:15:55,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2078/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 9.06791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:55,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66108 samples/s/p 2:51:51 } +2024-07-30 03:15:58,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2080/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:15:58,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66162 samples/s/p 2:51:48 } +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2082/ 3125], loss: 0.082, per_step_time: 1414ms, lr: 9.063888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:01,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.65706 samples/s/p 2:51:53 } +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2084/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.061873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:03,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.66022 samples/s/p 2:51:44 } +2024-07-30 03:16:06,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2086/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.059858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:06,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66027 samples/s/p 2:51:41 } +2024-07-30 03:16:09,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2088/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 9.0578405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:09,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.65868 samples/s/p 2:51:42 } +2024-07-30 03:16:12,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2090/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 9.0558215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:12,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66008 samples/s/p 2:51:36 } +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2092/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 9.0538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:15,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66014 samples/s/p 2:51:33 } +2024-07-30 03:16:18,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2094/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 9.051776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:18,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.66116 samples/s/p 2:51:29 } +2024-07-30 03:16:20,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2096/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 9.049751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:20,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66092 samples/s/p 2:51:26 } +2024-07-30 03:16:23,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2098/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 9.047724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:23,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65522 samples/s/p 2:51:34 } +2024-07-30 03:16:26,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2100/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 9.045693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:26,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66017 samples/s/p 2:51:22 } +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2102/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 9.043662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:29,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.66050 samples/s/p 2:51:18 } +2024-07-30 03:16:32,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2104/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 9.04163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:32,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.65532 samples/s/p 2:51:25 } +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2106/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 9.039595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:35,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66171 samples/s/p 2:51:11 } +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2108/ 3125], loss: 0.154, per_step_time: 1414ms, lr: 9.037558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:37,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65623 samples/s/p 2:51:18 } +2024-07-30 03:16:40,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2110/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 9.035519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:40,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.66246 samples/s/p 2:51:04 } +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2112/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 9.033478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:43,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65826 samples/s/p 2:51:08 } +2024-07-30 03:16:46,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2114/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 9.031435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:46,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.65844 samples/s/p 2:51:05 } +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2116/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 9.029391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66315 samples/s/p 2:50:54 } +2024-07-30 03:16:52,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2118/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 9.027343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:52,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66211 samples/s/p 2:50:53 } +2024-07-30 03:16:54,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2120/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 9.025296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:54,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66112 samples/s/p 2:50:52 } +2024-07-30 03:16:57,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2122/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.023245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:16:57,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.66164 samples/s/p 2:50:48 } +2024-07-30 03:17:00,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2124/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 9.021193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:00,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65959 samples/s/p 2:50:49 } +2024-07-30 03:17:03,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2126/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 9.019139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:03,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66141 samples/s/p 2:50:43 } +2024-07-30 03:17:06,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2128/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.017082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:06,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66013 samples/s/p 2:50:42 } +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2130/ 3125], loss: 0.311, per_step_time: 1412ms, lr: 9.015024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:09,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.66233 samples/s/p 2:50:36 } +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2132/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 9.012964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:11,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.65987 samples/s/p 2:50:37 } +2024-07-30 03:17:14,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2134/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 9.010902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:14,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65788 samples/s/p 2:50:38 } +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2136/ 3125], loss: 0.086, per_step_time: 1412ms, lr: 9.008838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:17,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66218 samples/s/p 2:50:27 } +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2138/ 3125], loss: 0.397, per_step_time: 1412ms, lr: 9.006773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:20,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.66202 samples/s/p 2:50:25 } +2024-07-30 03:17:23,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2140/ 3125], loss: 0.387, per_step_time: 1416ms, lr: 9.004705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:23,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.64890 samples/s/p 2:50:46 } +2024-07-30 03:17:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2142/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 9.002635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.65956 samples/s/p 2:50:24 } +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2144/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 9.000564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:28,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.65506 samples/s/p 2:50:29 } +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2146/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 8.998491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:31,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66147 samples/s/p 2:50:15 } +2024-07-30 03:17:34,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2148/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 8.996415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:34,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66018 samples/s/p 2:50:14 } +2024-07-30 03:17:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2150/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 8.994339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.66169 samples/s/p 2:50:08 } +2024-07-30 03:17:40,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2152/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.992258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:40,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65972 samples/s/p 2:50:09 } +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2154/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 8.990178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66238 samples/s/p 2:50:02 } +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2156/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.988095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65965 samples/s/p 2:50:04 } +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2158/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 8.9860105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:48,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.65932 samples/s/p 2:50:01 } +2024-07-30 03:17:51,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2160/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 8.983923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:51,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.66263 samples/s/p 2:49:53 } +2024-07-30 03:17:54,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2162/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.981835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:54,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66077 samples/s/p 2:49:53 } +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2164/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 8.979744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:17:57,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65656 samples/s/p 2:49:58 } +2024-07-30 03:18:00,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2166/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 8.977651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:00,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.66012 samples/s/p 2:49:49 } +2024-07-30 03:18:02,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2168/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.975558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:02,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65936 samples/s/p 2:49:47 } +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2170/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 8.973461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:05,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.65882 samples/s/p 2:49:45 } +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2172/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 8.971362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:08,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65973 samples/s/p 2:49:41 } +2024-07-30 03:18:11,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2174/ 3125], loss: 0.497, per_step_time: 1413ms, lr: 8.969263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:11,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65813 samples/s/p 2:49:41 } +2024-07-30 03:18:14,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2176/ 3125], loss: 0.241, per_step_time: 1414ms, lr: 8.967161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:14,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65571 samples/s/p 2:49:42 } +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2178/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 8.9650575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:17,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.65682 samples/s/p 2:49:38 } +2024-07-30 03:18:19,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2180/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 8.962952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:19,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65836 samples/s/p 2:49:32 } +2024-07-30 03:18:22,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2182/ 3125], loss: 0.547, per_step_time: 1413ms, lr: 8.960844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:22,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65943 samples/s/p 2:49:27 } +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2184/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.958734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:25,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65795 samples/s/p 2:49:27 } +2024-07-30 03:18:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2186/ 3125], loss: 0.458, per_step_time: 1414ms, lr: 8.956623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65687 samples/s/p 2:49:26 } +2024-07-30 03:18:31,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2188/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.954509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:31,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.65693 samples/s/p 2:49:23 } +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2190/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.952395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:34,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66077 samples/s/p 2:49:14 } +2024-07-30 03:18:36,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2192/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 8.950277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:36,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66066 samples/s/p 2:49:11 } +2024-07-30 03:18:39,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2194/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 8.948158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:39,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.66143 samples/s/p 2:49:07 } +2024-07-30 03:18:42,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2196/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 8.946038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:42,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65998 samples/s/p 2:49:07 } +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2198/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.943915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:45,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.65955 samples/s/p 2:49:04 } +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2200/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 8.94179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:48,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66217 samples/s/p 2:48:57 } +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2202/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 8.939664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:51,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66046 samples/s/p 2:48:57 } +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2204/ 3125], loss: 0.249, per_step_time: 1415ms, lr: 8.937535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:53,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.65186 samples/s/p 2:49:10 } +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.935404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:56,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.66150 samples/s/p 2:48:50 } +2024-07-30 03:18:59,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2208/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.9332725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:18:59,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66144 samples/s/p 2:48:47 } +2024-07-30 03:19:02,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2210/ 3125], loss: 0.392, per_step_time: 1412ms, lr: 8.931139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:02,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66384 samples/s/p 2:48:40 } +2024-07-30 03:19:05,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2212/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.929003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:05,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.65816 samples/s/p 2:48:47 } +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2214/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 8.926866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:08,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66132 samples/s/p 2:48:39 } +2024-07-30 03:19:10,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2216/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.924726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:10,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.66056 samples/s/p 2:48:37 } +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2218/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.922584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:13,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66136 samples/s/p 2:48:33 } +2024-07-30 03:19:16,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2220/ 3125], loss: 0.357, per_step_time: 1424ms, lr: 8.92044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:16,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.61441 samples/s/p 2:49:55 } +2024-07-30 03:19:19,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2222/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.918296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:19,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.65935 samples/s/p 2:48:31 } +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2224/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.916148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:22,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66135 samples/s/p 2:48:25 } +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2226/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.913999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:25,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.66166 samples/s/p 2:48:21 } +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2228/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.911848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:27,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66078 samples/s/p 2:48:20 } +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2230/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.909696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:30,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65932 samples/s/p 2:48:20 } +2024-07-30 03:19:33,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2232/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 8.907542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:33,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.66071 samples/s/p 2:48:14 } +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2234/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.905385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:36,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.65834 samples/s/p 2:48:16 } +2024-07-30 03:19:39,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2236/ 3125], loss: 0.187, per_step_time: 1416ms, lr: 8.903226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:39,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.64631 samples/s/p 2:48:34 } +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2238/ 3125], loss: 0.119, per_step_time: 1414ms, lr: 8.901066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:42,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65706 samples/s/p 2:48:12 } +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2240/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.8989045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:45,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.65907 samples/s/p 2:48:06 } +2024-07-30 03:19:47,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2242/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.896741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:47,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66003 samples/s/p 2:48:01 } +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2244/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.894574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:50,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.66093 samples/s/p 2:47:57 } +2024-07-30 03:19:53,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2246/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.892407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.65990 samples/s/p 2:47:56 } +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2248/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.890238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:56,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.66069 samples/s/p 2:47:52 } +2024-07-30 03:19:59,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2250/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.888067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:19:59,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66089 samples/s/p 2:47:49 } +2024-07-30 03:20:02,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2252/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.885892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:02,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66104 samples/s/p 2:47:45 } +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2254/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 8.883718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:04,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.66055 samples/s/p 2:47:44 } +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2256/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.881541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:07,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65971 samples/s/p 2:47:42 } +2024-07-30 03:20:10,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2258/ 3125], loss: 0.159, per_step_time: 1416ms, lr: 8.879362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:10,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.64879 samples/s/p 2:47:59 } +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2260/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.877181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66029 samples/s/p 2:47:36 } +2024-07-30 03:20:16,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2262/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.874999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:16,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.66094 samples/s/p 2:47:32 } +2024-07-30 03:20:19,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2264/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.872815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:19,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.65720 samples/s/p 2:47:35 } +2024-07-30 03:20:21,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2266/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.870629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:21,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.65987 samples/s/p 2:47:28 } +2024-07-30 03:20:24,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2268/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.86844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:24,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66145 samples/s/p 2:47:22 } +2024-07-30 03:20:27,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2270/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.86625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:27,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.66071 samples/s/p 2:47:21 } +2024-07-30 03:20:30,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2272/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.864059e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:30,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.65958 samples/s/p 2:47:20 } +2024-07-30 03:20:33,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2274/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.861865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:33,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66167 samples/s/p 2:47:13 } +2024-07-30 03:20:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2276/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.85967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66097 samples/s/p 2:47:12 } +2024-07-30 03:20:38,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2278/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 8.8574725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:38,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65969 samples/s/p 2:47:11 } +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2280/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.855273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.65873 samples/s/p 2:47:10 } +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2282/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.853073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:44,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.66126 samples/s/p 2:47:03 } +2024-07-30 03:20:47,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2284/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 8.85087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:47,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65629 samples/s/p 2:47:09 } +2024-07-30 03:20:50,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2286/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 8.848665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:50,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65416 samples/s/p 2:47:10 } +2024-07-30 03:20:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2288/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 8.8464585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:53,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66277 samples/s/p 2:46:52 } +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2290/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 8.84425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:55,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.66191 samples/s/p 2:46:50 } +2024-07-30 03:20:58,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2292/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 8.842041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:20:58,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.65915 samples/s/p 2:46:52 } +2024-07-30 03:21:01,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2294/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 8.839828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:01,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65684 samples/s/p 2:46:54 } +2024-07-30 03:21:04,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2296/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 8.837615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:04,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65778 samples/s/p 2:46:49 } +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2298/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 8.835399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:07,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65501 samples/s/p 2:46:51 } +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2300/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 8.833182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:10,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.65452 samples/s/p 2:46:49 } +2024-07-30 03:21:12,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2302/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 8.8309625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:12,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65848 samples/s/p 2:46:39 } +2024-07-30 03:21:15,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2304/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 8.828741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65944 samples/s/p 2:46:35 } +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2306/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 8.826519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:18,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65794 samples/s/p 2:46:35 } +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2308/ 3125], loss: 0.211, per_step_time: 1415ms, lr: 8.824293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:21,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.65344 samples/s/p 2:46:40 } +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2310/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 8.822068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.66205 samples/s/p 2:46:22 } +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2312/ 3125], loss: 0.224, per_step_time: 1416ms, lr: 8.8198385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:27,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.64962 samples/s/p 2:46:41 } +2024-07-30 03:21:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2314/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 8.817608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66178 samples/s/p 2:46:17 } +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2316/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 8.8153765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:32,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66274 samples/s/p 2:46:12 } +2024-07-30 03:21:35,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2318/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 8.813143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:35,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.65899 samples/s/p 2:46:16 } +2024-07-30 03:21:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2320/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.810907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:38,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.66285 samples/s/p 2:46:06 } +2024-07-30 03:21:41,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2322/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 8.808669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66178 samples/s/p 2:46:05 } +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2324/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.80643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:44,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66039 samples/s/p 2:46:05 } +2024-07-30 03:21:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2326/ 3125], loss: 0.665, per_step_time: 1413ms, lr: 8.804189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.66043 samples/s/p 2:46:02 } +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2328/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.801945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:49,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.65870 samples/s/p 2:46:02 } +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2330/ 3125], loss: 0.517, per_step_time: 1413ms, lr: 8.7997005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65902 samples/s/p 2:45:59 } +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2332/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.797455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:55,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.65981 samples/s/p 2:45:55 } +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2334/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 8.795207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:21:58,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66060 samples/s/p 2:45:50 } +2024-07-30 03:22:01,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2336/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 8.792956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:01,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66056 samples/s/p 2:45:48 } +2024-07-30 03:22:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2338/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.790704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:03,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.66072 samples/s/p 2:45:45 } +2024-07-30 03:22:06,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2340/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 8.788449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:06,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66142 samples/s/p 2:45:40 } +2024-07-30 03:22:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2342/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 8.7861945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66167 samples/s/p 2:45:37 } +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2344/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 8.783937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:12,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66199 samples/s/p 2:45:34 } +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2346/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.781677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:15,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.66125 samples/s/p 2:45:32 } +2024-07-30 03:22:18,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2348/ 3125], loss: 0.086, per_step_time: 1413ms, lr: 8.779416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:18,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.65878 samples/s/p 2:45:34 } +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2350/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 8.777153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:20,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65857 samples/s/p 2:45:31 } +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2352/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.774889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:23,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.66174 samples/s/p 2:45:23 } +2024-07-30 03:22:26,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2354/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.772622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65841 samples/s/p 2:45:26 } +2024-07-30 03:22:29,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2356/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.770355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:29,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.65762 samples/s/p 2:45:25 } +2024-07-30 03:22:32,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2358/ 3125], loss: 0.312, per_step_time: 1415ms, lr: 8.768084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:32,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65223 samples/s/p 2:45:31 } +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2360/ 3125], loss: 0.515, per_step_time: 1412ms, lr: 8.765812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:35,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66257 samples/s/p 2:45:10 } +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2362/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.763538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:37,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.65895 samples/s/p 2:45:14 } +2024-07-30 03:22:40,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2364/ 3125], loss: 0.183, per_step_time: 1418ms, lr: 8.7612625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:40,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.63883 samples/s/p 2:45:46 } +2024-07-30 03:22:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2366/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 8.758985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.66054 samples/s/p 2:45:05 } +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2368/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 8.756707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:46,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65896 samples/s/p 2:45:05 } +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2370/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 8.754426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65968 samples/s/p 2:45:01 } +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2372/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.752143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:52,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.65545 samples/s/p 2:45:06 } +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2374/ 3125], loss: 0.473, per_step_time: 1417ms, lr: 8.749858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.64428 samples/s/p 2:45:22 } +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2376/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 8.747572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:22:57,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.66037 samples/s/p 2:44:51 } +2024-07-30 03:23:00,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2378/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 8.745284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:00,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65845 samples/s/p 2:44:52 } +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2380/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.7429935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:03,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.65834 samples/s/p 2:44:49 } +2024-07-30 03:23:06,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2382/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 8.7407025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:06,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66248 samples/s/p 2:44:39 } +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2384/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.738409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.66058 samples/s/p 2:44:40 } +2024-07-30 03:23:11,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2386/ 3125], loss: 0.167, per_step_time: 1412ms, lr: 8.736114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:11,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66223 samples/s/p 2:44:34 } +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2388/ 3125], loss: 0.389, per_step_time: 1412ms, lr: 8.733817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:14,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66230 samples/s/p 2:44:31 } +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2390/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 8.731518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:17,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66165 samples/s/p 2:44:29 } +2024-07-30 03:23:20,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2392/ 3125], loss: 0.226, per_step_time: 1412ms, lr: 8.729217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:20,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66250 samples/s/p 2:44:25 } +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2394/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 8.726915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:23,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.66022 samples/s/p 2:44:26 } +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2396/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.724612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:26,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65944 samples/s/p 2:44:25 } +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2398/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 8.722305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:28,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.66036 samples/s/p 2:44:20 } +2024-07-30 03:23:31,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2400/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.719997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:31,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65809 samples/s/p 2:44:21 } +2024-07-30 03:23:34,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2402/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.717688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:34,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65945 samples/s/p 2:44:16 } +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2404/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 8.715378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:37,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.65995 samples/s/p 2:44:13 } +2024-07-30 03:23:40,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2406/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 8.713065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:40,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66088 samples/s/p 2:44:08 } +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2408/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 8.710749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:43,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.65149 samples/s/p 2:44:22 } +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2410/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 8.708433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:45,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66273 samples/s/p 2:43:59 } +2024-07-30 03:23:48,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2412/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.706115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:48,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66092 samples/s/p 2:44:00 } +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2414/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 8.703795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:51,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.66267 samples/s/p 2:43:54 } +2024-07-30 03:23:54,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2416/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.701472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:54,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66080 samples/s/p 2:43:54 } +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2418/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.699149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:23:57,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66024 samples/s/p 2:43:52 } +2024-07-30 03:24:00,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2420/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 8.696824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:00,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.66119 samples/s/p 2:43:48 } +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2422/ 3125], loss: 0.210, per_step_time: 1415ms, lr: 8.694497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:02,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.65220 samples/s/p 2:44:01 } +2024-07-30 03:24:05,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2424/ 3125], loss: 0.583, per_step_time: 1413ms, lr: 8.692168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:05,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65861 samples/s/p 2:43:47 } +2024-07-30 03:24:08,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2426/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.689837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:08,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66142 samples/s/p 2:43:39 } +2024-07-30 03:24:11,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2428/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 8.687505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:11,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66104 samples/s/p 2:43:37 } +2024-07-30 03:24:14,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2430/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 8.6851705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:14,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.66166 samples/s/p 2:43:33 } +2024-07-30 03:24:17,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2432/ 3125], loss: 0.409, per_step_time: 1415ms, lr: 8.682835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:17,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.65364 samples/s/p 2:43:44 } +2024-07-30 03:24:19,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2434/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 8.680497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:19,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.66162 samples/s/p 2:43:27 } +2024-07-30 03:24:22,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2436/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 8.678157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:22,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.65929 samples/s/p 2:43:28 } +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2438/ 3125], loss: 0.460, per_step_time: 1414ms, lr: 8.675816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:25,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65486 samples/s/p 2:43:33 } +2024-07-30 03:24:28,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2440/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 8.6734735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:28,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65961 samples/s/p 2:43:22 } +2024-07-30 03:24:31,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2442/ 3125], loss: 0.319, per_step_time: 1414ms, lr: 8.671129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:31,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.65749 samples/s/p 2:43:23 } +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2444/ 3125], loss: 0.472, per_step_time: 1413ms, lr: 8.668782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:34,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66111 samples/s/p 2:43:14 } +2024-07-30 03:24:36,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2446/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.666434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65822 samples/s/p 2:43:16 } +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2448/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 8.664085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:39,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.66019 samples/s/p 2:43:10 } +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2450/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 8.661733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:42,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.65935 samples/s/p 2:43:09 } +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2452/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.659379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:45,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65981 samples/s/p 2:43:05 } +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2454/ 3125], loss: 0.155, per_step_time: 1414ms, lr: 8.6570235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:48,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65530 samples/s/p 2:43:10 } +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2456/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 8.654667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:51,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66155 samples/s/p 2:42:56 } +2024-07-30 03:24:53,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2458/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.652309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.65894 samples/s/p 2:42:58 } +2024-07-30 03:24:56,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2460/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 8.649948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.66104 samples/s/p 2:42:52 } +2024-07-30 03:24:59,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2462/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.647586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:24:59,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65957 samples/s/p 2:42:51 } +2024-07-30 03:25:02,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2464/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.645222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66136 samples/s/p 2:42:45 } +2024-07-30 03:25:05,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2466/ 3125], loss: 0.425, per_step_time: 1412ms, lr: 8.642855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:05,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.66283 samples/s/p 2:42:40 } +2024-07-30 03:25:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2468/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.640488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:08,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65841 samples/s/p 2:42:45 } +2024-07-30 03:25:10,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2470/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.638119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:10,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.65710 samples/s/p 2:42:44 } +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2472/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 8.635749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:13,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65621 samples/s/p 2:42:43 } +2024-07-30 03:25:16,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2474/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 8.633376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65907 samples/s/p 2:42:35 } +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2476/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 8.631002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:19,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65578 samples/s/p 2:42:38 } +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2478/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.628625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.65592 samples/s/p 2:42:35 } +2024-07-30 03:25:25,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2480/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 8.626247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:25,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66177 samples/s/p 2:42:22 } +2024-07-30 03:25:27,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2482/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 8.623868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:27,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66004 samples/s/p 2:42:22 } +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2484/ 3125], loss: 0.112, per_step_time: 1412ms, lr: 8.621487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:30,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66254 samples/s/p 2:42:15 } +2024-07-30 03:25:33,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2486/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.619103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:33,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66093 samples/s/p 2:42:15 } +2024-07-30 03:25:36,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2488/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.616719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:36,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.66037 samples/s/p 2:42:13 } +2024-07-30 03:25:39,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2490/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 8.614333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65994 samples/s/p 2:42:11 } +2024-07-30 03:25:42,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2492/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 8.611944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:42,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65786 samples/s/p 2:42:12 } +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2494/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 8.609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:44,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65985 samples/s/p 2:42:06 } +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2496/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 8.607162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:47,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65999 samples/s/p 2:42:02 } +2024-07-30 03:25:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2498/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.6047685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.65886 samples/s/p 2:42:02 } +2024-07-30 03:25:53,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2500/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.602375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:53,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66083 samples/s/p 2:41:55 } +2024-07-30 03:25:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2502/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 8.599976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:56,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65612 samples/s/p 2:42:01 } +2024-07-30 03:25:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2504/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 8.597579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:25:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.65748 samples/s/p 2:41:55 } +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2506/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 8.595178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:01,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.66184 samples/s/p 2:41:45 } +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2508/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 8.592777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:04,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66123 samples/s/p 2:41:43 } +2024-07-30 03:26:07,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2510/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 8.590373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66073 samples/s/p 2:41:41 } +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2512/ 3125], loss: 0.230, per_step_time: 1416ms, lr: 8.587968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:10,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.64838 samples/s/p 2:42:00 } +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2514/ 3125], loss: 0.258, per_step_time: 1414ms, lr: 8.58556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:13,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.65398 samples/s/p 2:41:47 } +2024-07-30 03:26:16,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2516/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 8.5831525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:16,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.66027 samples/s/p 2:41:34 } +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2518/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 8.580741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:18,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65710 samples/s/p 2:41:36 } +2024-07-30 03:26:21,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2520/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.578329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:21,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66009 samples/s/p 2:41:28 } +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2522/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.575915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:24,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65995 samples/s/p 2:41:26 } +2024-07-30 03:26:27,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2524/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.573499e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.65882 samples/s/p 2:41:25 } +2024-07-30 03:26:30,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2526/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 8.571082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.66213 samples/s/p 2:41:16 } +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2528/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 8.568663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:33,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65636 samples/s/p 2:41:23 } +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2530/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.566242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:35,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65913 samples/s/p 2:41:16 } +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2532/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 8.563819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:38,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.65981 samples/s/p 2:41:12 } +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2534/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 8.561396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.66072 samples/s/p 2:41:08 } +2024-07-30 03:26:44,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2536/ 3125], loss: 0.029, per_step_time: 1412ms, lr: 8.55897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66267 samples/s/p 2:41:01 } +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2538/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 8.556542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:47,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66091 samples/s/p 2:41:02 } +2024-07-30 03:26:50,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2540/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 8.554112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66056 samples/s/p 2:40:59 } +2024-07-30 03:26:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2542/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 8.551682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:52,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66008 samples/s/p 2:40:57 } +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2544/ 3125], loss: 0.513, per_step_time: 1412ms, lr: 8.549249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.66246 samples/s/p 2:40:50 } +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2546/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 8.546815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:26:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65940 samples/s/p 2:40:53 } +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2548/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 8.544379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:01,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66117 samples/s/p 2:40:47 } +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2550/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 8.541941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:04,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65892 samples/s/p 2:40:48 } +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2552/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.539501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:07,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.65943 samples/s/p 2:40:44 } +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2554/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 8.537061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:09,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.66215 samples/s/p 2:40:37 } +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2556/ 3125], loss: 0.344, per_step_time: 1415ms, lr: 8.534618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65357 samples/s/p 2:40:49 } +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2558/ 3125], loss: 0.511, per_step_time: 1414ms, lr: 8.532173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65544 samples/s/p 2:40:43 } +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2560/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 8.529727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:18,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65665 samples/s/p 2:40:38 } +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2562/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 8.5272795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:21,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65977 samples/s/p 2:40:30 } +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2564/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 8.52483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:24,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.65925 samples/s/p 2:40:28 } +2024-07-30 03:27:26,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2566/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 8.522378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:26,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.65918 samples/s/p 2:40:25 } +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2568/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.519925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66116 samples/s/p 2:40:19 } +2024-07-30 03:27:32,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2570/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 8.517471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:32,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66203 samples/s/p 2:40:14 } +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2572/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 8.515014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:35,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.66000 samples/s/p 2:40:15 } +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2574/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 8.512557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:38,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65967 samples/s/p 2:40:13 } +2024-07-30 03:27:41,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2576/ 3125], loss: 0.606, per_step_time: 1414ms, lr: 8.510097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:41,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65499 samples/s/p 2:40:18 } +2024-07-30 03:27:44,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2578/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.507635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:44,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.65889 samples/s/p 2:40:08 } +2024-07-30 03:27:46,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2580/ 3125], loss: 0.156, per_step_time: 1412ms, lr: 8.505172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:46,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66293 samples/s/p 2:39:59 } +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2582/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 8.502709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:49,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.66084 samples/s/p 2:39:59 } +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2584/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 8.500242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:52,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65899 samples/s/p 2:40:00 } +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2586/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 8.497773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:55,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65723 samples/s/p 2:40:00 } +2024-07-30 03:27:58,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2588/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 8.495304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:27:58,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66080 samples/s/p 2:39:51 } +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2590/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 8.492833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:01,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.65863 samples/s/p 2:39:52 } +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2592/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 8.4903595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:03,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.66213 samples/s/p 2:39:43 } +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2594/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.487885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:06,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66079 samples/s/p 2:39:43 } +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2596/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.485409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:09,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66160 samples/s/p 2:39:38 } +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2598/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 8.482931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:12,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.66108 samples/s/p 2:39:36 } +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2600/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 8.480451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.65953 samples/s/p 2:39:36 } +2024-07-30 03:28:18,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2602/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 8.477969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:18,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.65619 samples/s/p 2:39:39 } +2024-07-30 03:28:20,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2604/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 8.4754865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:20,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66008 samples/s/p 2:39:30 } +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2606/ 3125], loss: 0.323, per_step_time: 1424ms, lr: 8.473002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:23,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.61434 samples/s/p 2:40:45 } +2024-07-30 03:28:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2608/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 8.470515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66119 samples/s/p 2:39:22 } +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2610/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 8.468027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:29,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.66241 samples/s/p 2:39:17 } +2024-07-30 03:28:32,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2612/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 8.465538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:32,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65803 samples/s/p 2:39:22 } +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2614/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 8.4630465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:35,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65714 samples/s/p 2:39:21 } +2024-07-30 03:28:37,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2616/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.4605535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65805 samples/s/p 2:39:16 } +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2618/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 8.45806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:40,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.66142 samples/s/p 2:39:08 } +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2620/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 8.455562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.65770 samples/s/p 2:39:11 } +2024-07-30 03:28:46,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2622/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 8.453065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:46,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.65825 samples/s/p 2:39:07 } +2024-07-30 03:28:49,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2624/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.4505655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:49,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.66013 samples/s/p 2:39:01 } +2024-07-30 03:28:52,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2626/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.448064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:52,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.66089 samples/s/p 2:38:57 } +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2628/ 3125], loss: 0.112, per_step_time: 1414ms, lr: 8.445561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:54,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.65608 samples/s/p 2:39:03 } +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2630/ 3125], loss: 0.297, per_step_time: 1412ms, lr: 8.443058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:28:57,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66175 samples/s/p 2:38:50 } +2024-07-30 03:29:00,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2632/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 8.440551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:00,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65466 samples/s/p 2:38:59 } +2024-07-30 03:29:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2634/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.438044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:03,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65968 samples/s/p 2:38:48 } +2024-07-30 03:29:06,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2636/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 8.435534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:06,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.66296 samples/s/p 2:38:40 } +2024-07-30 03:29:09,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2638/ 3125], loss: 0.058, per_step_time: 1415ms, lr: 8.433022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:09,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.65111 samples/s/p 2:38:57 } +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2640/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 8.43051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:11,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66335 samples/s/p 2:38:33 } +2024-07-30 03:29:14,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2642/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 8.427995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:14,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.66050 samples/s/p 2:38:35 } +2024-07-30 03:29:17,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2644/ 3125], loss: 0.282, per_step_time: 1416ms, lr: 8.425479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:17,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.64805 samples/s/p 2:38:53 } +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2646/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 8.422962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:20,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65871 samples/s/p 2:38:33 } +2024-07-30 03:29:23,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2648/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.420443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:23,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.65893 samples/s/p 2:38:29 } +2024-07-30 03:29:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2650/ 3125], loss: 0.492, per_step_time: 1413ms, lr: 8.417922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65781 samples/s/p 2:38:28 } +2024-07-30 03:29:28,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2652/ 3125], loss: 0.169, per_step_time: 1416ms, lr: 8.4154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:28,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.64747 samples/s/p 2:38:43 } +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2654/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 8.412875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:31,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.65850 samples/s/p 2:38:22 } +2024-07-30 03:29:34,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2656/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 8.410349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:34,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.66125 samples/s/p 2:38:14 } +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2658/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 8.407823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:37,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66072 samples/s/p 2:38:12 } +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2660/ 3125], loss: 0.666, per_step_time: 1413ms, lr: 8.405293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:40,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.66081 samples/s/p 2:38:09 } +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2662/ 3125], loss: 0.224, per_step_time: 1414ms, lr: 8.402762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:43,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65761 samples/s/p 2:38:12 } +2024-07-30 03:29:45,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2664/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 8.40023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:45,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65865 samples/s/p 2:38:07 } +2024-07-30 03:29:48,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2666/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 8.397697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:48,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.65749 samples/s/p 2:38:06 } +2024-07-30 03:29:51,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2668/ 3125], loss: 0.216, per_step_time: 1414ms, lr: 8.395162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:51,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65648 samples/s/p 2:38:05 } +2024-07-30 03:29:54,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2670/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 8.392624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:54,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.65800 samples/s/p 2:38:00 } +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2672/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 8.390086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:29:57,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66051 samples/s/p 2:37:53 } +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2674/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.387545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:00,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66101 samples/s/p 2:37:49 } +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2676/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.385003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:02,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.66167 samples/s/p 2:37:45 } +2024-07-30 03:30:05,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2678/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 8.38246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:05,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.65722 samples/s/p 2:37:50 } +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2680/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 8.379913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:08,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66276 samples/s/p 2:37:38 } +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2682/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 8.377367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:11,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66134 samples/s/p 2:37:37 } +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2684/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.374818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:14,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.66005 samples/s/p 2:37:37 } +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2686/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 8.372269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:17,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66201 samples/s/p 2:37:31 } +2024-07-30 03:30:19,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2688/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 8.369716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:19,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66017 samples/s/p 2:37:31 } +2024-07-30 03:30:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2690/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 8.367164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:22,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65786 samples/s/p 2:37:32 } +2024-07-30 03:30:25,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2692/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 8.364609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:25,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.65987 samples/s/p 2:37:26 } +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2694/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.3620525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:28,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.66030 samples/s/p 2:37:22 } +2024-07-30 03:30:31,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2696/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 8.359494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:31,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66006 samples/s/p 2:37:20 } +2024-07-30 03:30:34,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2698/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 8.356935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:34,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65890 samples/s/p 2:37:19 } +2024-07-30 03:30:36,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2700/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 8.354374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:36,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65917 samples/s/p 2:37:16 } +2024-07-30 03:30:39,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2702/ 3125], loss: 0.419, per_step_time: 1414ms, lr: 8.351811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:39,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.65700 samples/s/p 2:37:16 } +2024-07-30 03:30:42,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2704/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 8.349247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:42,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.66079 samples/s/p 2:37:07 } +2024-07-30 03:30:45,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2706/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.34668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:45,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.66153 samples/s/p 2:37:03 } +2024-07-30 03:30:48,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2708/ 3125], loss: 0.245, per_step_time: 1417ms, lr: 8.344113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:48,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.64450 samples/s/p 2:37:29 } +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2710/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.3415425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:51,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65924 samples/s/p 2:37:01 } +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2712/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 8.338972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:53,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65855 samples/s/p 2:37:00 } +2024-07-30 03:30:56,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2714/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 8.336399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:56,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.65974 samples/s/p 2:36:55 } +2024-07-30 03:30:59,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2716/ 3125], loss: 0.380, per_step_time: 1414ms, lr: 8.3338255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:30:59,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65530 samples/s/p 2:36:59 } +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2718/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 8.33125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:02,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65640 samples/s/p 2:36:55 } +2024-07-30 03:31:05,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2720/ 3125], loss: 0.154, per_step_time: 1415ms, lr: 8.328672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:05,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65159 samples/s/p 2:37:00 } +2024-07-30 03:31:08,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2722/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 8.326094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:08,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.65945 samples/s/p 2:36:44 } +2024-07-30 03:31:10,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2724/ 3125], loss: 0.192, per_step_time: 1412ms, lr: 8.323513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:10,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66303 samples/s/p 2:36:35 } +2024-07-30 03:31:13,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2726/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 8.320931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:13,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66256 samples/s/p 2:36:33 } +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2728/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.318348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:16,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66052 samples/s/p 2:36:34 } +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2730/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.315763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:19,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66152 samples/s/p 2:36:29 } +2024-07-30 03:31:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2732/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 8.313175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.66059 samples/s/p 2:36:28 } +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2734/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.310587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:25,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66247 samples/s/p 2:36:22 } +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2736/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 8.307998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:27,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65898 samples/s/p 2:36:25 } +2024-07-30 03:31:30,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2738/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 8.3054065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:30,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.66024 samples/s/p 2:36:20 } +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2740/ 3125], loss: 0.346, per_step_time: 1416ms, lr: 8.3028135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.64676 samples/s/p 2:36:40 } +2024-07-30 03:31:36,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2742/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 8.300218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:36,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.65823 samples/s/p 2:36:18 } +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2744/ 3125], loss: 0.310, per_step_time: 1416ms, lr: 8.297622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:39,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.64626 samples/s/p 2:36:35 } +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2746/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.295025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:42,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65939 samples/s/p 2:36:10 } +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2748/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.292424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:44,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65971 samples/s/p 2:36:07 } +2024-07-30 03:31:47,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2750/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 8.289823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:47,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.65653 samples/s/p 2:36:09 } +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2752/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.287221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:50,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65871 samples/s/p 2:36:03 } +2024-07-30 03:31:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2754/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 8.284617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:53,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66017 samples/s/p 2:35:58 } +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2756/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.282012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:56,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65881 samples/s/p 2:35:57 } +2024-07-30 03:31:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2758/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 8.279404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:31:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.65994 samples/s/p 2:35:52 } +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2760/ 3125], loss: 0.341, per_step_time: 1412ms, lr: 8.276795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.66298 samples/s/p 2:35:44 } +2024-07-30 03:32:04,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2762/ 3125], loss: 0.064, per_step_time: 1412ms, lr: 8.274184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:04,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66205 samples/s/p 2:35:43 } +2024-07-30 03:32:07,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2764/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 8.271573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:07,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65832 samples/s/p 2:35:46 } +2024-07-30 03:32:10,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2766/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 8.26896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:10,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.66090 samples/s/p 2:35:39 } +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2768/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 8.266344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:13,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.65464 samples/s/p 2:35:47 } +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2770/ 3125], loss: 0.292, per_step_time: 1417ms, lr: 8.263728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.64506 samples/s/p 2:36:00 } +2024-07-30 03:32:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2772/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 8.2611095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65820 samples/s/p 2:35:35 } +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2774/ 3125], loss: 0.234, per_step_time: 1416ms, lr: 8.25849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:21,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.64732 samples/s/p 2:35:50 } +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2776/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 8.255868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65896 samples/s/p 2:35:28 } +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2778/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.253245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:27,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.65976 samples/s/p 2:35:24 } +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2780/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 8.250621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:30,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66160 samples/s/p 2:35:18 } +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2782/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 8.2479955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:33,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65960 samples/s/p 2:35:19 } +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2784/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 8.245368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:35,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.66094 samples/s/p 2:35:14 } +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2786/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.242739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:38,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65964 samples/s/p 2:35:13 } +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2788/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 8.240108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:41,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.65942 samples/s/p 2:35:11 } +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2790/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 8.237476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:44,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66190 samples/s/p 2:35:04 } +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2792/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 8.234842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:47,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65658 samples/s/p 2:35:10 } +2024-07-30 03:32:50,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2794/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 8.2322085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.65842 samples/s/p 2:35:04 } +2024-07-30 03:32:52,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2796/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 8.22957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:52,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66380 samples/s/p 2:34:52 } +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2798/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 8.226932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:55,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.66064 samples/s/p 2:34:55 } +2024-07-30 03:32:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2800/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.224293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:32:58,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65791 samples/s/p 2:34:56 } +2024-07-30 03:32:58,651 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 03:33:33,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2802/ 3125], loss: 0.252, per_step_time: 2057ms, lr: 8.221651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:33,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 3.88778 samples/s/p 3:45:25 } +2024-07-30 03:33:36,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2804/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 8.219007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:36,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.65837 samples/s/p 2:34:50 } +2024-07-30 03:33:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2806/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.216363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:39,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.66132 samples/s/p 2:34:42 } +2024-07-30 03:33:42,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2808/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.213718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.66010 samples/s/p 2:34:41 } +2024-07-30 03:33:44,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2810/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 8.211069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:44,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65961 samples/s/p 2:34:39 } +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2812/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.208421e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:47,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.65848 samples/s/p 2:34:38 } +2024-07-30 03:33:50,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2814/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 8.20577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:50,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.66074 samples/s/p 2:34:32 } +2024-07-30 03:33:53,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2816/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 8.203118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.65711 samples/s/p 2:34:35 } +2024-07-30 03:33:56,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2818/ 3125], loss: 0.163, per_step_time: 1416ms, lr: 8.200464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:56,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.64755 samples/s/p 2:34:48 } +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2820/ 3125], loss: 0.291, per_step_time: 1412ms, lr: 8.19781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:33:59,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66257 samples/s/p 2:34:20 } +2024-07-30 03:34:02,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2822/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 8.195152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:02,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66056 samples/s/p 2:34:21 } +2024-07-30 03:34:04,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2824/ 3125], loss: 0.480, per_step_time: 1412ms, lr: 8.1924945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:04,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.66312 samples/s/p 2:34:14 } +2024-07-30 03:34:07,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2826/ 3125], loss: 0.451, per_step_time: 1421ms, lr: 8.189835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:07,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.62788 samples/s/p 2:35:09 } +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2828/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 8.187173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:10,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65811 samples/s/p 2:34:16 } +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2830/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 8.184512e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:13,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.66004 samples/s/p 2:34:10 } +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2832/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 8.181846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:16,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65894 samples/s/p 2:34:09 } +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2834/ 3125], loss: 0.295, per_step_time: 1415ms, lr: 8.17918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:19,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.65307 samples/s/p 2:34:16 } +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2836/ 3125], loss: 0.293, per_step_time: 1412ms, lr: 8.176514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66204 samples/s/p 2:33:59 } +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2838/ 3125], loss: 0.379, per_step_time: 1413ms, lr: 8.1738435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:24,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65865 samples/s/p 2:34:01 } +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2840/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 8.171173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:27,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65996 samples/s/p 2:33:56 } +2024-07-30 03:34:30,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2842/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 8.168502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:30,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.65880 samples/s/p 2:33:55 } +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2844/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 8.165828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:33,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.66106 samples/s/p 2:33:49 } +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2846/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 8.163152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:36,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65465 samples/s/p 2:33:57 } +2024-07-30 03:34:38,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2848/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 8.160477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:38,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65995 samples/s/p 2:33:45 } +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2850/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 8.157799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:41,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.65883 samples/s/p 2:33:44 } +2024-07-30 03:34:44,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2852/ 3125], loss: 0.294, per_step_time: 1424ms, lr: 8.155119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:44,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.61443 samples/s/p 2:34:54 } +2024-07-30 03:34:47,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2854/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 8.152439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:47,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.66120 samples/s/p 2:33:35 } +2024-07-30 03:34:50,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 8.149756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66108 samples/s/p 2:33:32 } +2024-07-30 03:34:53,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2858/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 8.147072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:53,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65550 samples/s/p 2:33:38 } +2024-07-30 03:34:55,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2860/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 8.144387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:55,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65878 samples/s/p 2:33:30 } +2024-07-30 03:34:58,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2862/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 8.1417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:34:58,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.66009 samples/s/p 2:33:25 } +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2864/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 8.139012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:01,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.65989 samples/s/p 2:33:22 } +2024-07-30 03:35:04,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2866/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 8.1363205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:04,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.65486 samples/s/p 2:33:28 } +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2868/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 8.133629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:07,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66062 samples/s/p 2:33:16 } +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2870/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 8.130936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:10,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.66029 samples/s/p 2:33:13 } +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2872/ 3125], loss: 0.205, per_step_time: 1417ms, lr: 8.1282415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:13,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.64515 samples/s/p 2:33:35 } +2024-07-30 03:35:16,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2874/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.125546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65876 samples/s/p 2:33:10 } +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2876/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 8.122848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:19,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65884 samples/s/p 2:33:07 } +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2878/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 8.12015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65973 samples/s/p 2:33:03 } +2024-07-30 03:35:24,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2880/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.117449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:24,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.66030 samples/s/p 2:32:59 } +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2882/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 8.114746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:27,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.65709 samples/s/p 2:33:02 } +2024-07-30 03:35:30,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2884/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.112043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:30,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65913 samples/s/p 2:32:55 } +2024-07-30 03:35:33,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2886/ 3125], loss: 0.262, per_step_time: 1416ms, lr: 8.109339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:33,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.64902 samples/s/p 2:33:09 } +2024-07-30 03:35:36,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2888/ 3125], loss: 0.190, per_step_time: 1412ms, lr: 8.106633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:36,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.66185 samples/s/p 2:32:45 } +2024-07-30 03:35:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2890/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 8.103924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65748 samples/s/p 2:32:50 } +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2892/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 8.101215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:41,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.65651 samples/s/p 2:32:48 } +2024-07-30 03:35:44,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2894/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.098505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66038 samples/s/p 2:32:39 } +2024-07-30 03:35:47,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2896/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 8.0957925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:47,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.65801 samples/s/p 2:32:40 } +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2898/ 3125], loss: 0.418, per_step_time: 1413ms, lr: 8.0930795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:50,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66014 samples/s/p 2:32:34 } +2024-07-30 03:35:53,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2900/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 8.090362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:53,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.66074 samples/s/p 2:32:30 } +2024-07-30 03:35:55,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2902/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 8.087645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:55,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65474 samples/s/p 2:32:37 } +2024-07-30 03:35:58,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2904/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 8.084929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:35:58,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65137 samples/s/p 2:32:40 } +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2906/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.082207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:01,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.66143 samples/s/p 2:32:21 } +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2908/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 8.079487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:04,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65985 samples/s/p 2:32:20 } +2024-07-30 03:36:07,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2910/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 8.076764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:07,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.65849 samples/s/p 2:32:20 } +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2912/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 8.07404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:10,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66054 samples/s/p 2:32:14 } +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2914/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 8.071315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:13,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65965 samples/s/p 2:32:12 } +2024-07-30 03:36:15,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2916/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 8.068589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:15,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66048 samples/s/p 2:32:08 } +2024-07-30 03:36:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2918/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 8.065859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:18,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.65772 samples/s/p 2:32:10 } +2024-07-30 03:36:21,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2920/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 8.063129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:21,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.66141 samples/s/p 2:32:01 } +2024-07-30 03:36:24,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2922/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 8.060398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66018 samples/s/p 2:32:00 } +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2924/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 8.057666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:27,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65615 samples/s/p 2:32:04 } +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2926/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 8.05493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:30,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.66142 samples/s/p 2:31:52 } +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2928/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 8.052194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:32,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.65771 samples/s/p 2:31:56 } +2024-07-30 03:36:35,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2930/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.049457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:35,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65706 samples/s/p 2:31:54 } +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2932/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 8.046719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66090 samples/s/p 2:31:45 } +2024-07-30 03:36:41,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2934/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 8.043978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:41,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66033 samples/s/p 2:31:43 } +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2936/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 8.0412365e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.66190 samples/s/p 2:31:38 } +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2938/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 8.038493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:47,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.65971 samples/s/p 2:31:38 } +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2940/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.035749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:49,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65494 samples/s/p 2:31:43 } +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2942/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 8.033003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:52,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65944 samples/s/p 2:31:33 } +2024-07-30 03:36:55,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2944/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.030256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:55,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66064 samples/s/p 2:31:28 } +2024-07-30 03:36:58,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2946/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 8.027507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:36:58,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.65788 samples/s/p 2:31:30 } +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2948/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 8.024756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:01,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.66003 samples/s/p 2:31:24 } +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2950/ 3125], loss: 0.508, per_step_time: 1413ms, lr: 8.022005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:04,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65774 samples/s/p 2:31:24 } +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2952/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 8.019252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:06,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65159 samples/s/p 2:31:31 } +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2954/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 8.016496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:09,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.65967 samples/s/p 2:31:16 } +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2956/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 8.013741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:12,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.66095 samples/s/p 2:31:11 } +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2958/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.010983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:15,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.66083 samples/s/p 2:31:08 } +2024-07-30 03:37:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2960/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 8.008224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:18,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65975 samples/s/p 2:31:07 } +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2962/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 8.005464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.66074 samples/s/p 2:31:03 } +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2964/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 8.002702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:23,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65380 samples/s/p 2:31:11 } +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2966/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 7.999938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:26,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.65947 samples/s/p 2:30:59 } +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2968/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 7.997174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.66019 samples/s/p 2:30:55 } +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2970/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 7.9944075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:32,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65686 samples/s/p 2:30:58 } +2024-07-30 03:37:35,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2972/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 7.991641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:35,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65702 samples/s/p 2:30:54 } +2024-07-30 03:37:38,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2974/ 3125], loss: 0.402, per_step_time: 1415ms, lr: 7.988871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:38,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.65371 samples/s/p 2:30:57 } +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2976/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 7.986101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:40,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.66137 samples/s/p 2:30:42 } +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2978/ 3125], loss: 0.486, per_step_time: 1413ms, lr: 7.983329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:43,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65908 samples/s/p 2:30:43 } +2024-07-30 03:37:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2980/ 3125], loss: 0.218, per_step_time: 1414ms, lr: 7.980555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:46,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.65677 samples/s/p 2:30:44 } +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2982/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.977781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:49,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66055 samples/s/p 2:30:35 } +2024-07-30 03:37:52,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2984/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 7.975005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:52,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.66009 samples/s/p 2:30:33 } +2024-07-30 03:37:55,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2986/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 7.972229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:55,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66101 samples/s/p 2:30:28 } +2024-07-30 03:37:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2988/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.969448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:37:57,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65816 samples/s/p 2:30:30 } +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2990/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.966668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.66048 samples/s/p 2:30:23 } +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2992/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 7.963886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:03,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65311 samples/s/p 2:30:32 } +2024-07-30 03:38:06,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2994/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 7.961103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:06,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.65655 samples/s/p 2:30:24 } +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2996/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 7.958318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:09,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.65710 samples/s/p 2:30:20 } +2024-07-30 03:38:12,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 2998/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 7.955532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:12,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.66026 samples/s/p 2:30:13 } +2024-07-30 03:38:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3000/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.952744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:14,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.66100 samples/s/p 2:30:09 } +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3002/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 7.949957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:17,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.65985 samples/s/p 2:30:08 } +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3004/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 7.9471665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:20,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.66051 samples/s/p 2:30:04 } +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3006/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.9443735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66117 samples/s/p 2:30:00 } +2024-07-30 03:38:26,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3008/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 7.94158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:26,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65914 samples/s/p 2:30:00 } +2024-07-30 03:38:29,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3010/ 3125], loss: 0.503, per_step_time: 1412ms, lr: 7.938786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:29,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66214 samples/s/p 2:29:53 } +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3012/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.93599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.66085 samples/s/p 2:29:52 } +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3014/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 7.933193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:34,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.65877 samples/s/p 2:29:52 } +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3016/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 7.9303945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:37,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65960 samples/s/p 2:29:48 } +2024-07-30 03:38:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3018/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 7.927595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:40,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.66046 samples/s/p 2:29:44 } +2024-07-30 03:38:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3020/ 3125], loss: 0.311, per_step_time: 1415ms, lr: 7.924794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:43,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65197 samples/s/p 2:29:55 } +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3022/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.92199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:46,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.65827 samples/s/p 2:29:42 } +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3024/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.919186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.66124 samples/s/p 2:29:34 } +2024-07-30 03:38:51,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3026/ 3125], loss: 0.484, per_step_time: 1414ms, lr: 7.91638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:51,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65641 samples/s/p 2:29:39 } +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3028/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 7.9135725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:54,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65457 samples/s/p 2:29:39 } +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3030/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.910764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:38:57,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65734 samples/s/p 2:29:32 } +2024-07-30 03:39:00,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3032/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 7.907955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:00,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.65672 samples/s/p 2:29:30 } +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3034/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 7.905143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65419 samples/s/p 2:29:31 } +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3036/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 7.902331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66179 samples/s/p 2:29:16 } +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3038/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.899518e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:08,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66116 samples/s/p 2:29:15 } +2024-07-30 03:39:11,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3040/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.896702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:11,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.66330 samples/s/p 2:29:08 } +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3042/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 7.893886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:14,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.65854 samples/s/p 2:29:13 } +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3044/ 3125], loss: 0.133, per_step_time: 1412ms, lr: 7.891067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:17,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66222 samples/s/p 2:29:04 } +2024-07-30 03:39:20,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3046/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 7.888248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:20,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.65951 samples/s/p 2:29:06 } +2024-07-30 03:39:22,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3048/ 3125], loss: 0.188, per_step_time: 1412ms, lr: 7.885426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:22,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66192 samples/s/p 2:28:59 } +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3050/ 3125], loss: 0.253, per_step_time: 1412ms, lr: 7.882604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.66199 samples/s/p 2:28:56 } +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3052/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 7.87978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:28,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66158 samples/s/p 2:28:54 } +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3054/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.876955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66018 samples/s/p 2:28:53 } +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3056/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 7.874129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66132 samples/s/p 2:28:49 } +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3058/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 7.871301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:37,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.65912 samples/s/p 2:28:50 } +2024-07-30 03:39:39,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3060/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 7.8684725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:39,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.66296 samples/s/p 2:28:41 } +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3062/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 7.865641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66004 samples/s/p 2:28:42 } +2024-07-30 03:39:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3064/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.862808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:45,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65888 samples/s/p 2:28:41 } +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3066/ 3125], loss: 0.247, per_step_time: 1412ms, lr: 7.859976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:48,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.66233 samples/s/p 2:28:33 } +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3068/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 7.857141e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:51,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65689 samples/s/p 2:28:39 } +2024-07-30 03:39:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3070/ 3125], loss: 0.408, per_step_time: 1415ms, lr: 7.854305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.65298 samples/s/p 2:28:42 } +2024-07-30 03:39:56,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3072/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 7.851468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:56,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.66026 samples/s/p 2:28:28 } +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3074/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.84863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:39:59,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65973 samples/s/p 2:28:26 } +2024-07-30 03:40:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3076/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.845789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:02,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.65871 samples/s/p 2:28:25 } +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3078/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 7.842948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:05,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.66094 samples/s/p 2:28:18 } +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3080/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 7.840105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65950 samples/s/p 2:28:18 } +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3082/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 7.8372605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:11,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65579 samples/s/p 2:28:21 } +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3084/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.834416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:13,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.65703 samples/s/p 2:28:16 } +2024-07-30 03:40:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3086/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 7.831569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:16,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66120 samples/s/p 2:28:07 } +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3088/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 7.82872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:19,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.66239 samples/s/p 2:28:02 } +2024-07-30 03:40:22,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3090/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.825871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:22,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66022 samples/s/p 2:28:03 } +2024-07-30 03:40:25,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3092/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.82302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:25,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.66083 samples/s/p 2:27:59 } +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3094/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.820167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:28,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65863 samples/s/p 2:27:59 } +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3096/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 7.817314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65941 samples/s/p 2:27:55 } +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3098/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.814459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:33,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.65957 samples/s/p 2:27:52 } +2024-07-30 03:40:36,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3100/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 7.811602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:36,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66062 samples/s/p 2:27:48 } +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3102/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 7.808745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:39,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65742 samples/s/p 2:27:50 } +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3104/ 3125], loss: 0.542, per_step_time: 1414ms, lr: 7.8058865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:42,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.65532 samples/s/p 2:27:50 } +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3106/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 7.803026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:45,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.66091 samples/s/p 2:27:39 } +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3108/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 7.800165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.65950 samples/s/p 2:27:38 } +2024-07-30 03:40:50,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3110/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.797301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:50,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66143 samples/s/p 2:27:32 } +2024-07-30 03:40:53,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3112/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 7.794437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:53,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66107 samples/s/p 2:27:30 } +2024-07-30 03:40:56,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3114/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 7.791571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:56,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66017 samples/s/p 2:27:29 } +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3116/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 7.788703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:40:59,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.66046 samples/s/p 2:27:25 } +2024-07-30 03:41:02,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3118/ 3125], loss: 0.107, per_step_time: 1414ms, lr: 7.785835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:02,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65652 samples/s/p 2:27:29 } +2024-07-30 03:41:04,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3120/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 7.782965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:04,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65781 samples/s/p 2:27:24 } +2024-07-30 03:41:07,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3122/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 7.780095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:07,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65889 samples/s/p 2:27:19 } +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 3], step:[ 3124/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.777224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:10,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65844 samples/s/p 2:27:17 } +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 7.774349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:13,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.65761 samples/s/p 2:27:16 } +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 7.771474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:16,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65756 samples/s/p 2:27:13 } +2024-07-30 03:41:19,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 5/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 7.768598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:19,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65995 samples/s/p 2:27:06 } +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 7/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.7657205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.66045 samples/s/p 2:27:03 } +2024-07-30 03:41:24,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 9/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.762842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:24,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.65892 samples/s/p 2:27:02 } +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 11/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.759961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:27,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.65799 samples/s/p 2:27:01 } +2024-07-30 03:41:30,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 13/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.757079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:30,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66155 samples/s/p 2:26:53 } +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 15/ 3125], loss: 0.090, per_step_time: 1412ms, lr: 7.754197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:33,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66200 samples/s/p 2:26:49 } +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 17/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 7.751312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66021 samples/s/p 2:26:49 } +2024-07-30 03:41:38,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 19/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 7.748427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:38,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.66113 samples/s/p 2:26:45 } +2024-07-30 03:41:41,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 21/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.74554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:41,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66199 samples/s/p 2:26:41 } +2024-07-30 03:41:44,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 23/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.742651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:44,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66063 samples/s/p 2:26:40 } +2024-07-30 03:41:47,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 25/ 3125], loss: 0.442, per_step_time: 1413ms, lr: 7.739762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:47,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65821 samples/s/p 2:26:41 } +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 27/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.736871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:50,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.65864 samples/s/p 2:26:37 } +2024-07-30 03:41:53,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 29/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 7.733979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:53,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.66157 samples/s/p 2:26:30 } +2024-07-30 03:41:55,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 31/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.731086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:55,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66015 samples/s/p 2:26:29 } +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 33/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.728191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:41:58,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66017 samples/s/p 2:26:27 } +2024-07-30 03:42:01,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 35/ 3125], loss: 0.050, per_step_time: 1413ms, lr: 7.725296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:01,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.66121 samples/s/p 2:26:22 } +2024-07-30 03:42:04,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 37/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 7.7223995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:04,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65883 samples/s/p 2:26:23 } +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 39/ 3125], loss: 0.476, per_step_time: 1413ms, lr: 7.7195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:07,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.65846 samples/s/p 2:26:21 } +2024-07-30 03:42:10,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 41/ 3125], loss: 0.196, per_step_time: 1412ms, lr: 7.7166005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:10,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66233 samples/s/p 2:26:12 } +2024-07-30 03:42:12,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 43/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 7.713699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.66069 samples/s/p 2:26:12 } +2024-07-30 03:42:15,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 45/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.710796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:15,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65838 samples/s/p 2:26:12 } +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 47/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 7.707892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:18,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.65623 samples/s/p 2:26:13 } +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 49/ 3125], loss: 0.134, per_step_time: 1415ms, lr: 7.704987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:21,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65369 samples/s/p 2:26:14 } +2024-07-30 03:42:24,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 51/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 7.702081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:24,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65412 samples/s/p 2:26:10 } +2024-07-30 03:42:27,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 53/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 7.699174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.65612 samples/s/p 2:26:05 } +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 55/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.696265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:29,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66018 samples/s/p 2:25:55 } +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 57/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 7.693354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.66154 samples/s/p 2:25:50 } +2024-07-30 03:42:35,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 59/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 7.6904425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:35,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.66122 samples/s/p 2:25:48 } +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 61/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 7.687529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:38,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.65809 samples/s/p 2:25:50 } +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 63/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 7.684615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:41,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65826 samples/s/p 2:25:47 } +2024-07-30 03:42:44,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 65/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 7.6817005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:44,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.66221 samples/s/p 2:25:38 } +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 67/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 7.678784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:46,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.65823 samples/s/p 2:25:41 } +2024-07-30 03:42:49,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 69/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 7.675866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:49,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65844 samples/s/p 2:25:38 } +2024-07-30 03:42:52,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 71/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.6729475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:52,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.65959 samples/s/p 2:25:34 } +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 73/ 3125], loss: 0.266, per_step_time: 1425ms, lr: 7.670027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.61304 samples/s/p 2:26:43 } +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 75/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.667105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:42:58,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.66146 samples/s/p 2:25:25 } +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 77/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 7.664182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:01,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65930 samples/s/p 2:25:26 } +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 79/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 7.661257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.65986 samples/s/p 2:25:22 } +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 81/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.658331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66095 samples/s/p 2:25:17 } +2024-07-30 03:43:09,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 83/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.655404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:09,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66110 samples/s/p 2:25:14 } +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 85/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 7.652477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:12,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.66247 samples/s/p 2:25:09 } +2024-07-30 03:43:15,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 87/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.649548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:15,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65897 samples/s/p 2:25:12 } +2024-07-30 03:43:18,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 89/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 7.646618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:18,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66240 samples/s/p 2:25:04 } +2024-07-30 03:43:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 91/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.643685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:20,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.65961 samples/s/p 2:25:05 } +2024-07-30 03:43:23,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 93/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 7.640752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:23,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66025 samples/s/p 2:25:02 } +2024-07-30 03:43:26,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 95/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 7.637817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:26,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.66153 samples/s/p 2:24:57 } +2024-07-30 03:43:29,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 97/ 3125], loss: 0.124, per_step_time: 1412ms, lr: 7.6348815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:29,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.66195 samples/s/p 2:24:53 } +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 99/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 7.631944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:32,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65738 samples/s/p 2:24:58 } +2024-07-30 03:43:35,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 101/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 7.629007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:35,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65778 samples/s/p 2:24:54 } +2024-07-30 03:43:37,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 103/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 7.626067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:37,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.65775 samples/s/p 2:24:51 } +2024-07-30 03:43:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 105/ 3125], loss: 0.223, per_step_time: 1414ms, lr: 7.6231267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:40,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65724 samples/s/p 2:24:49 } +2024-07-30 03:43:43,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 107/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 7.6201854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:43,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65711 samples/s/p 2:24:47 } +2024-07-30 03:43:46,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 109/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 7.6172423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65965 samples/s/p 2:24:40 } +2024-07-30 03:43:49,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 111/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 7.614297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:49,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.65895 samples/s/p 2:24:38 } +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 113/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 7.6113506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:52,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.66088 samples/s/p 2:24:32 } +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 115/ 3125], loss: 0.049, per_step_time: 1412ms, lr: 7.608404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:54,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66294 samples/s/p 2:24:26 } +2024-07-30 03:43:57,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 117/ 3125], loss: 0.554, per_step_time: 1413ms, lr: 7.6054557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:43:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65880 samples/s/p 2:24:30 } +2024-07-30 03:44:00,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 119/ 3125], loss: 0.228, per_step_time: 1425ms, lr: 7.6025067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:00,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.61146 samples/s/p 2:25:40 } +2024-07-30 03:44:03,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 121/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.5995563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:03,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.66123 samples/s/p 2:24:21 } +2024-07-30 03:44:06,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 123/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.5966045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:06,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.65819 samples/s/p 2:24:22 } +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 125/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 7.5936505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:09,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65910 samples/s/p 2:24:18 } +2024-07-30 03:44:12,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 127/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 7.5906964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:12,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65675 samples/s/p 2:24:19 } +2024-07-30 03:44:14,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 129/ 3125], loss: 0.126, per_step_time: 1414ms, lr: 7.5877415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:14,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.65728 samples/s/p 2:24:15 } +2024-07-30 03:44:17,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 131/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.5847843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:17,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.66063 samples/s/p 2:24:07 } +2024-07-30 03:44:20,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 133/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 7.5818257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:20,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65786 samples/s/p 2:24:09 } +2024-07-30 03:44:23,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 135/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.578866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:23,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65730 samples/s/p 2:24:07 } +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 137/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 7.5759062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:26,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65844 samples/s/p 2:24:02 } +2024-07-30 03:44:29,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 139/ 3125], loss: 0.216, per_step_time: 1415ms, lr: 7.5729445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:29,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.65318 samples/s/p 2:24:07 } +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 141/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 7.569982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.66173 samples/s/p 2:23:51 } +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 143/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 7.567018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:34,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65839 samples/s/p 2:23:54 } +2024-07-30 03:44:37,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 145/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 7.5640514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:37,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66271 samples/s/p 2:23:44 } +2024-07-30 03:44:40,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 147/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 7.5610837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:40,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.65933 samples/s/p 2:23:47 } +2024-07-30 03:44:43,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 149/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.5581165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:43,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66125 samples/s/p 2:23:41 } +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 151/ 3125], loss: 0.153, per_step_time: 1412ms, lr: 7.555147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:46,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.66197 samples/s/p 2:23:37 } +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 153/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 7.5521775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:48,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65901 samples/s/p 2:23:39 } +2024-07-30 03:44:51,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 155/ 3125], loss: 0.485, per_step_time: 1412ms, lr: 7.5492057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:51,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66272 samples/s/p 2:23:30 } +2024-07-30 03:44:54,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 157/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 7.5462335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:54,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.65945 samples/s/p 2:23:32 } +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 159/ 3125], loss: 0.145, per_step_time: 1412ms, lr: 7.5432595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:44:57,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.66298 samples/s/p 2:23:24 } +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 161/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 7.5402836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:00,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66306 samples/s/p 2:23:21 } +2024-07-30 03:45:03,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 163/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 7.5373077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:03,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65886 samples/s/p 2:23:25 } +2024-07-30 03:45:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 165/ 3125], loss: 0.220, per_step_time: 1418ms, lr: 7.5343296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:05,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.63834 samples/s/p 2:23:53 } +2024-07-30 03:45:08,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 167/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.5313505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:08,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.65811 samples/s/p 2:23:20 } +2024-07-30 03:45:11,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 169/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 7.5283706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:11,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.66129 samples/s/p 2:23:13 } +2024-07-30 03:45:14,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 171/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 7.525389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:14,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66127 samples/s/p 2:23:10 } +2024-07-30 03:45:17,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 173/ 3125], loss: 0.153, per_step_time: 1414ms, lr: 7.522407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:17,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65567 samples/s/p 2:23:15 } +2024-07-30 03:45:20,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 175/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.519424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:20,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.65992 samples/s/p 2:23:06 } +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 177/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 7.516439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:22,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66056 samples/s/p 2:23:02 } +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 179/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 7.5134526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:25,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.66107 samples/s/p 2:22:59 } +2024-07-30 03:45:28,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 181/ 3125], loss: 0.536, per_step_time: 1414ms, lr: 7.5104654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:28,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65452 samples/s/p 2:23:06 } +2024-07-30 03:45:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 183/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 7.5074754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65778 samples/s/p 2:22:58 } +2024-07-30 03:45:34,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 185/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 7.5044863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:34,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.66117 samples/s/p 2:22:50 } +2024-07-30 03:45:37,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 187/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.501496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:37,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65608 samples/s/p 2:22:55 } +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 189/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 7.4985037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.65984 samples/s/p 2:22:47 } +2024-07-30 03:45:42,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 191/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 7.495511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:42,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65866 samples/s/p 2:22:45 } +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 193/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 7.4925165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:45,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65809 samples/s/p 2:22:44 } +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 195/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 7.4895215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:48,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.65755 samples/s/p 2:22:42 } +2024-07-30 03:45:51,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 197/ 3125], loss: 0.272, per_step_time: 1417ms, lr: 7.4865234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:51,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.64455 samples/s/p 2:22:58 } +2024-07-30 03:45:54,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 199/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 7.4835257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:54,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65657 samples/s/p 2:22:37 } +2024-07-30 03:45:56,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 201/ 3125], loss: 0.027, per_step_time: 1414ms, lr: 7.4805257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65735 samples/s/p 2:22:33 } +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 203/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.4775253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:45:59,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.66079 samples/s/p 2:22:25 } +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 205/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 7.4745244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:02,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.65674 samples/s/p 2:22:29 } +2024-07-30 03:46:05,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 207/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.4715217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:05,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.66045 samples/s/p 2:22:20 } +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 209/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 7.4685177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:08,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66102 samples/s/p 2:22:16 } +2024-07-30 03:46:11,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 211/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.465513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:11,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65988 samples/s/p 2:22:15 } +2024-07-30 03:46:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 213/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.462506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.65904 samples/s/p 2:22:14 } +2024-07-30 03:46:16,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 215/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 7.4594986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:16,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66171 samples/s/p 2:22:07 } +2024-07-30 03:46:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 217/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.45649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:19,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.66003 samples/s/p 2:22:07 } +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 219/ 3125], loss: 0.121, per_step_time: 1412ms, lr: 7.4534796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:22,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66220 samples/s/p 2:22:01 } +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 221/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.4504687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:25,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66162 samples/s/p 2:21:59 } +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 223/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 7.447457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:28,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66129 samples/s/p 2:21:56 } +2024-07-30 03:46:30,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 225/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 7.4444433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:30,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.66245 samples/s/p 2:21:52 } +2024-07-30 03:46:33,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 227/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 7.4414297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65934 samples/s/p 2:21:54 } +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 229/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.438414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:36,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66125 samples/s/p 2:21:48 } +2024-07-30 03:46:39,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 231/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 7.4353975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:39,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.66090 samples/s/p 2:21:46 } +2024-07-30 03:46:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 233/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 7.432379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65651 samples/s/p 2:21:49 } +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 235/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 7.429359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:45,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.65893 samples/s/p 2:21:43 } +2024-07-30 03:46:47,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 237/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 7.4263385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66005 samples/s/p 2:21:38 } +2024-07-30 03:46:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 239/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 7.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66021 samples/s/p 2:21:35 } +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 241/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 7.4202953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:53,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.66130 samples/s/p 2:21:31 } +2024-07-30 03:46:56,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 243/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 7.4172717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:56,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.65929 samples/s/p 2:21:31 } +2024-07-30 03:46:59,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 245/ 3125], loss: 0.160, per_step_time: 1416ms, lr: 7.4142467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:46:59,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.64622 samples/s/p 2:21:48 } +2024-07-30 03:47:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 247/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 7.4112213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:02,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65360 samples/s/p 2:21:34 } +2024-07-30 03:47:04,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 249/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 7.408193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:04,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.65946 samples/s/p 2:21:22 } +2024-07-30 03:47:07,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 251/ 3125], loss: 0.422, per_step_time: 1412ms, lr: 7.4051645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.66181 samples/s/p 2:21:16 } +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 253/ 3125], loss: 0.345, per_step_time: 1415ms, lr: 7.4021355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.65124 samples/s/p 2:21:29 } +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 255/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.399104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:13,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.66044 samples/s/p 2:21:12 } +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 257/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.396072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65746 samples/s/p 2:21:14 } +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 259/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 7.393039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:19,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65160 samples/s/p 2:21:20 } +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 261/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 7.3900055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:21,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65807 samples/s/p 2:21:07 } +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 263/ 3125], loss: 0.533, per_step_time: 1414ms, lr: 7.3869705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.65696 samples/s/p 2:21:06 } +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 265/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 7.383934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66119 samples/s/p 2:20:57 } +2024-07-30 03:47:30,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 267/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.380896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:30,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65991 samples/s/p 2:20:56 } +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 269/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 7.377857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:33,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.66077 samples/s/p 2:20:52 } +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 271/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 7.374817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65982 samples/s/p 2:20:51 } +2024-07-30 03:47:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 273/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.371776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.65886 samples/s/p 2:20:49 } +2024-07-30 03:47:41,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 275/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 7.3687343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:41,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65754 samples/s/p 2:20:48 } +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 277/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.3656915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:44,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.66165 samples/s/p 2:20:39 } +2024-07-30 03:47:47,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 279/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 7.3626475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:47,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65759 samples/s/p 2:20:43 } +2024-07-30 03:47:50,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 281/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 7.3596025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:50,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.65687 samples/s/p 2:20:41 } +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 283/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 7.3565557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65887 samples/s/p 2:20:35 } +2024-07-30 03:47:55,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 285/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 7.353507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:55,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66190 samples/s/p 2:20:28 } +2024-07-30 03:47:58,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 287/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 7.350459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:47:58,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65806 samples/s/p 2:20:31 } +2024-07-30 03:48:01,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 289/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.347408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:01,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.65919 samples/s/p 2:20:26 } +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 291/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 7.344357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:04,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.66060 samples/s/p 2:20:21 } +2024-07-30 03:48:07,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 293/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 7.341305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:07,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65798 samples/s/p 2:20:22 } +2024-07-30 03:48:10,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 295/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 7.338252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:10,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65849 samples/s/p 2:20:19 } +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 297/ 3125], loss: 0.263, per_step_time: 1412ms, lr: 7.3351976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:12,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66201 samples/s/p 2:20:11 } +2024-07-30 03:48:15,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 299/ 3125], loss: 0.336, per_step_time: 1412ms, lr: 7.3321426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:15,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.66230 samples/s/p 2:20:07 } +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 301/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.329085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.65870 samples/s/p 2:20:10 } +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 303/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 7.3260276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:21,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65916 samples/s/p 2:20:06 } +2024-07-30 03:48:24,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 305/ 3125], loss: 0.338, per_step_time: 1425ms, lr: 7.3229676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:24,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.61298 samples/s/p 2:21:13 } +2024-07-30 03:48:27,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 307/ 3125], loss: 0.191, per_step_time: 1415ms, lr: 7.319908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.65330 samples/s/p 2:20:09 } +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 309/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.3168467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:29,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.66062 samples/s/p 2:19:56 } +2024-07-30 03:48:32,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 311/ 3125], loss: 0.349, per_step_time: 1414ms, lr: 7.313785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:32,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65715 samples/s/p 2:19:58 } +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 313/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 7.3107217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:35,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65984 samples/s/p 2:19:51 } +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 315/ 3125], loss: 0.327, per_step_time: 1412ms, lr: 7.307658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:38,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66282 samples/s/p 2:19:44 } +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 317/ 3125], loss: 0.287, per_step_time: 1415ms, lr: 7.3045926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:41,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.65145 samples/s/p 2:19:58 } +2024-07-30 03:48:44,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 319/ 3125], loss: 0.253, per_step_time: 1412ms, lr: 7.301526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:44,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.66226 samples/s/p 2:19:39 } +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 321/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.2984576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:47,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65417 samples/s/p 2:19:48 } +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 323/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 7.2953876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:49,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66123 samples/s/p 2:19:35 } +2024-07-30 03:48:52,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 325/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 7.292318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:52,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.66075 samples/s/p 2:19:33 } +2024-07-30 03:48:55,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 327/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.289247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:55,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65921 samples/s/p 2:19:32 } +2024-07-30 03:48:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 329/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 7.2861753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:48:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.65679 samples/s/p 2:19:33 } +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 331/ 3125], loss: 0.421, per_step_time: 1412ms, lr: 7.2831026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:01,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66231 samples/s/p 2:19:22 } +2024-07-30 03:49:04,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 333/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 7.280029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:04,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66096 samples/s/p 2:19:21 } +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 335/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 7.2769526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:06,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.66427 samples/s/p 2:19:14 } +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 337/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.2738767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:09,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65816 samples/s/p 2:19:20 } +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 339/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 7.270799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:12,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.65922 samples/s/p 2:19:15 } +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 341/ 3125], loss: 0.279, per_step_time: 1415ms, lr: 7.2677194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65205 samples/s/p 2:19:23 } +2024-07-30 03:49:18,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 343/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.2646403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:18,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.66054 samples/s/p 2:19:08 } +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 345/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 7.2615594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:21,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65633 samples/s/p 2:19:11 } +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 347/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 7.2584776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:23,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.65716 samples/s/p 2:19:07 } +2024-07-30 03:49:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 349/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.255395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:26,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66076 samples/s/p 2:18:59 } +2024-07-30 03:49:29,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 351/ 3125], loss: 0.398, per_step_time: 1412ms, lr: 7.2523117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:29,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.66181 samples/s/p 2:18:55 } +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 353/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 7.249226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:32,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65647 samples/s/p 2:19:00 } +2024-07-30 03:49:35,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 355/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 7.2461407e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:35,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65974 samples/s/p 2:18:52 } +2024-07-30 03:49:38,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 357/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 7.2430526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:38,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.65383 samples/s/p 2:18:58 } +2024-07-30 03:49:40,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 359/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.2399635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:40,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65935 samples/s/p 2:18:47 } +2024-07-30 03:49:43,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 361/ 3125], loss: 0.337, per_step_time: 1415ms, lr: 7.236874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:43,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.65344 samples/s/p 2:18:53 } +2024-07-30 03:49:46,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 363/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 7.233784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:46,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66176 samples/s/p 2:18:38 } +2024-07-30 03:49:49,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 365/ 3125], loss: 0.235, per_step_time: 1412ms, lr: 7.230693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:49,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66199 samples/s/p 2:18:35 } +2024-07-30 03:49:52,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 367/ 3125], loss: 0.042, per_step_time: 1413ms, lr: 7.2276007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.66150 samples/s/p 2:18:32 } +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 369/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.224507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:55,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.66075 samples/s/p 2:18:31 } +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 371/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 7.221411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:49:57,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.65914 samples/s/p 2:18:30 } +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 373/ 3125], loss: 0.220, per_step_time: 1418ms, lr: 7.218316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.63978 samples/s/p 2:18:56 } +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 375/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 7.215219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:03,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.65956 samples/s/p 2:18:24 } +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 377/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 7.21212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:06,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65109 samples/s/p 2:18:34 } +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 379/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.209022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:09,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66126 samples/s/p 2:18:16 } +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 381/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.205922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:12,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66231 samples/s/p 2:18:12 } +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 383/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 7.202821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:14,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.66022 samples/s/p 2:18:12 } +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 385/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 7.199719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:17,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.65539 samples/s/p 2:18:16 } +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 387/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 7.1966165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:20,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65912 samples/s/p 2:18:08 } +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 389/ 3125], loss: 0.102, per_step_time: 1415ms, lr: 7.193513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:23,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65096 samples/s/p 2:18:17 } +2024-07-30 03:50:26,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 391/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 7.190406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:26,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65944 samples/s/p 2:18:02 } +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 393/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.1872996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:29,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.65981 samples/s/p 2:17:58 } +2024-07-30 03:50:31,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 395/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 7.184192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.66066 samples/s/p 2:17:54 } +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 397/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 7.181084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:34,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66029 samples/s/p 2:17:52 } +2024-07-30 03:50:37,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 399/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 7.177975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:37,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66091 samples/s/p 2:17:48 } +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 401/ 3125], loss: 0.318, per_step_time: 1412ms, lr: 7.174864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:40,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.66261 samples/s/p 2:17:43 } +2024-07-30 03:50:43,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 403/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 7.1717536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:43,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.65909 samples/s/p 2:17:45 } +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 405/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.168641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:46,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66016 samples/s/p 2:17:41 } +2024-07-30 03:50:48,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 407/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 7.1655268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:48,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.65812 samples/s/p 2:17:41 } +2024-07-30 03:50:51,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 409/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.162412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:51,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66097 samples/s/p 2:17:34 } +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 411/ 3125], loss: 0.375, per_step_time: 1412ms, lr: 7.1592967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:54,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66222 samples/s/p 2:17:29 } +2024-07-30 03:50:57,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 413/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 7.1561794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:50:57,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.66110 samples/s/p 2:17:28 } +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 415/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 7.1530612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:00,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66047 samples/s/p 2:17:26 } +2024-07-30 03:51:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 417/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 7.149943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:03,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66040 samples/s/p 2:17:23 } +2024-07-30 03:51:05,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 419/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 7.146824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:05,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65827 samples/s/p 2:17:24 } +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 421/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 7.1437034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:08,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.66260 samples/s/p 2:17:15 } +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 423/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 7.1405816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:11,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.65917 samples/s/p 2:17:17 } +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 425/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.137458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:14,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65991 samples/s/p 2:17:13 } +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 427/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.1343343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:17,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65939 samples/s/p 2:17:11 } +2024-07-30 03:51:20,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 429/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 7.131209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65876 samples/s/p 2:17:09 } +2024-07-30 03:51:22,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 431/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 7.128083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:22,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.65486 samples/s/p 2:17:12 } +2024-07-30 03:51:25,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 433/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 7.1249565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:25,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.66283 samples/s/p 2:16:57 } +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 435/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 7.1218287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:28,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65630 samples/s/p 2:17:04 } +2024-07-30 03:51:31,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 437/ 3125], loss: 0.260, per_step_time: 1414ms, lr: 7.1187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:31,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.65402 samples/s/p 2:17:04 } +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 439/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.11557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:34,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65692 samples/s/p 2:16:57 } +2024-07-30 03:51:37,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 441/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.1124396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:37,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.65664 samples/s/p 2:16:55 } +2024-07-30 03:51:39,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 443/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 7.109307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:39,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66170 samples/s/p 2:16:45 } +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 445/ 3125], loss: 0.195, per_step_time: 1412ms, lr: 7.106174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:42,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66208 samples/s/p 2:16:41 } +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 447/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 7.103039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:45,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65942 samples/s/p 2:16:42 } +2024-07-30 03:51:48,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 449/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.0999045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:48,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.65869 samples/s/p 2:16:41 } +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 451/ 3125], loss: 0.402, per_step_time: 1412ms, lr: 7.0967685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:51,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.66268 samples/s/p 2:16:32 } +2024-07-30 03:51:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 453/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 7.093632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.65668 samples/s/p 2:16:38 } +2024-07-30 03:51:56,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 455/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.0904944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:56,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66081 samples/s/p 2:16:29 } +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 457/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 7.0873557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:51:59,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66255 samples/s/p 2:16:24 } +2024-07-30 03:52:02,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 459/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 7.0842143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:02,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.66069 samples/s/p 2:16:24 } +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 461/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 7.081074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:05,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66065 samples/s/p 2:16:21 } +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 463/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 7.077932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:08,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66103 samples/s/p 2:16:18 } +2024-07-30 03:52:11,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 465/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 7.0747888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:11,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.66100 samples/s/p 2:16:15 } +2024-07-30 03:52:13,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 467/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 7.071645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:13,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65895 samples/s/p 2:16:15 } +2024-07-30 03:52:16,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 469/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 7.0685005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:16,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.65987 samples/s/p 2:16:11 } +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 471/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.0653537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65835 samples/s/p 2:16:10 } +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 473/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 7.0622073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:22,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.66058 samples/s/p 2:16:04 } +2024-07-30 03:52:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 475/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 7.0590595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:25,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65859 samples/s/p 2:16:04 } +2024-07-30 03:52:28,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 477/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 7.055911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:28,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65950 samples/s/p 2:16:00 } +2024-07-30 03:52:30,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 479/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 7.0527603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:30,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.65344 samples/s/p 2:16:06 } +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 481/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 7.0496094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:33,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.65830 samples/s/p 2:15:56 } +2024-07-30 03:52:36,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 483/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.046458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:36,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66127 samples/s/p 2:15:49 } +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 485/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 7.043305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66051 samples/s/p 2:15:47 } +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 487/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.040151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:42,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66093 samples/s/p 2:15:44 } +2024-07-30 03:52:45,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 489/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 7.036997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:45,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.66057 samples/s/p 2:15:41 } +2024-07-30 03:52:47,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 491/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 7.033841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:47,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.65970 samples/s/p 2:15:40 } +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 493/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 7.0306837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:50,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66105 samples/s/p 2:15:35 } +2024-07-30 03:52:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 495/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 7.0275264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66227 samples/s/p 2:15:31 } +2024-07-30 03:52:56,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 497/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 7.0243677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:56,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.66121 samples/s/p 2:15:29 } +2024-07-30 03:52:59,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 499/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 7.0212086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:52:59,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66153 samples/s/p 2:15:26 } +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 501/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 7.018047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:02,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65852 samples/s/p 2:15:27 } +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 503/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 7.014886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.65586 samples/s/p 2:15:28 } +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 505/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.0117235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:07,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66026 samples/s/p 2:15:19 } +2024-07-30 03:53:10,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 507/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 7.0085603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:10,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.66298 samples/s/p 2:15:13 } +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 509/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 7.0053957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:13,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65412 samples/s/p 2:15:22 } +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 511/ 3125], loss: 0.140, per_step_time: 1414ms, lr: 7.0022306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:16,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65534 samples/s/p 2:15:18 } +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 513/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 6.9990638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:19,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65705 samples/s/p 2:15:13 } +2024-07-30 03:53:21,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 515/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 6.9958965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:21,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.66218 samples/s/p 2:15:02 } +2024-07-30 03:53:24,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 517/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 6.9927287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:24,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.65996 samples/s/p 2:15:03 } +2024-07-30 03:53:27,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 519/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 6.9895596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:27,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.66120 samples/s/p 2:14:58 } +2024-07-30 03:53:30,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 521/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.9863895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:30,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.65973 samples/s/p 2:14:57 } +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 523/ 3125], loss: 0.258, per_step_time: 1420ms, lr: 6.983218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:33,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.63199 samples/s/p 2:15:34 } +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 525/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.980046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:36,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.65912 samples/s/p 2:14:53 } +2024-07-30 03:53:38,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 527/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.976873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.66070 samples/s/p 2:14:48 } +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 529/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 6.9736993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:41,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65882 samples/s/p 2:14:47 } +2024-07-30 03:53:44,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 531/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 6.9705247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65967 samples/s/p 2:14:43 } +2024-07-30 03:53:47,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 533/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 6.967349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:47,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65792 samples/s/p 2:14:43 } +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 535/ 3125], loss: 0.098, per_step_time: 1414ms, lr: 6.964172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.65399 samples/s/p 2:14:46 } +2024-07-30 03:53:53,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 537/ 3125], loss: 0.678, per_step_time: 1413ms, lr: 6.9609937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:53,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65817 samples/s/p 2:14:37 } +2024-07-30 03:53:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 539/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.957816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:55,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66008 samples/s/p 2:14:31 } +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 541/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 6.9546363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:53:58,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65891 samples/s/p 2:14:30 } +2024-07-30 03:54:01,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 543/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 6.9514554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:01,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.66027 samples/s/p 2:14:26 } +2024-07-30 03:54:04,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 545/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.9482744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:04,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.65957 samples/s/p 2:14:24 } +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 547/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 6.945091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:07,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66029 samples/s/p 2:14:20 } +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 549/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9419084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:10,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66110 samples/s/p 2:14:16 } +2024-07-30 03:54:12,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 551/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.9387243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:12,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.66051 samples/s/p 2:14:14 } +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 553/ 3125], loss: 0.216, per_step_time: 1416ms, lr: 6.935539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:15,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.64676 samples/s/p 2:14:31 } +2024-07-30 03:54:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 555/ 3125], loss: 0.210, per_step_time: 1412ms, lr: 6.9323532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66208 samples/s/p 2:14:06 } +2024-07-30 03:54:21,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 557/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 6.929166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:21,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.65742 samples/s/p 2:14:10 } +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 559/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 6.9259777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:24,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66043 samples/s/p 2:14:03 } +2024-07-30 03:54:27,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 561/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 6.9227895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:27,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66044 samples/s/p 2:14:00 } +2024-07-30 03:54:29,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 563/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.9195994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:29,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.66140 samples/s/p 2:13:56 } +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 565/ 3125], loss: 0.587, per_step_time: 1413ms, lr: 6.916409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:32,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.66001 samples/s/p 2:13:55 } +2024-07-30 03:54:35,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 567/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.913218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:35,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65794 samples/s/p 2:13:55 } +2024-07-30 03:54:38,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 569/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.9100247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:38,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65895 samples/s/p 2:13:51 } +2024-07-30 03:54:41,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 571/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 6.9068315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:41,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.65918 samples/s/p 2:13:48 } +2024-07-30 03:54:44,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 573/ 3125], loss: 0.064, per_step_time: 1417ms, lr: 6.9036373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:44,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.64554 samples/s/p 2:14:04 } +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 575/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.9004423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:46,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66109 samples/s/p 2:13:39 } +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 577/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 6.8972463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:49,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.65884 samples/s/p 2:13:40 } +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 579/ 3125], loss: 0.125, per_step_time: 1412ms, lr: 6.894049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:52,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66191 samples/s/p 2:13:32 } +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 581/ 3125], loss: 0.071, per_step_time: 1413ms, lr: 6.8908503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:55,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.66094 samples/s/p 2:13:31 } +2024-07-30 03:54:58,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 583/ 3125], loss: 0.261, per_step_time: 1415ms, lr: 6.887652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:54:58,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65327 samples/s/p 2:13:39 } +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 585/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.8844524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:01,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65898 samples/s/p 2:13:28 } +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 587/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.881252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:03,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66148 samples/s/p 2:13:22 } +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 589/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 6.8780505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:06,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.65771 samples/s/p 2:13:24 } +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 591/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.8748477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:09,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.66004 samples/s/p 2:13:18 } +2024-07-30 03:55:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 593/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.8716445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:12,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.66049 samples/s/p 2:13:15 } +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 595/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 6.8684403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:15,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65652 samples/s/p 2:13:17 } +2024-07-30 03:55:18,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 597/ 3125], loss: 0.225, per_step_time: 1418ms, lr: 6.8652353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:18,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.63986 samples/s/p 2:13:38 } +2024-07-30 03:55:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 599/ 3125], loss: 0.277, per_step_time: 1426ms, lr: 6.8620293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:21,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.60817 samples/s/p 2:14:21 } +2024-07-30 03:55:23,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 601/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.858822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:23,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.65852 samples/s/p 2:13:06 } +2024-07-30 03:55:26,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 603/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 6.855614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:26,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65846 samples/s/p 2:13:03 } +2024-07-30 03:55:29,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 605/ 3125], loss: 0.471, per_step_time: 1413ms, lr: 6.852406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:29,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65879 samples/s/p 2:13:00 } +2024-07-30 03:55:32,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 607/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 6.8491963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:32,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65945 samples/s/p 2:12:56 } +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 609/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.8459854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:35,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.65715 samples/s/p 2:12:57 } +2024-07-30 03:55:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 611/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.8427744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65790 samples/s/p 2:12:53 } +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 613/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.8395625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:40,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65911 samples/s/p 2:12:48 } +2024-07-30 03:55:43,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 615/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 6.836349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:43,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65994 samples/s/p 2:12:44 } +2024-07-30 03:55:46,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 617/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.833135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:46,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.65897 samples/s/p 2:12:43 } +2024-07-30 03:55:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 619/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 6.829921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.66002 samples/s/p 2:12:38 } +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 621/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 6.826705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:52,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66052 samples/s/p 2:12:35 } +2024-07-30 03:55:55,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 623/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 6.823488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:55,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.66114 samples/s/p 2:12:31 } +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 625/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 6.8202708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:55:57,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.66018 samples/s/p 2:12:30 } +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 627/ 3125], loss: 0.379, per_step_time: 1414ms, lr: 6.817053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:00,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65766 samples/s/p 2:12:30 } +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 629/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.8138334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:03,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.65868 samples/s/p 2:12:26 } +2024-07-30 03:56:06,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 631/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.8106133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:06,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65871 samples/s/p 2:12:23 } +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 633/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 6.8073928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:09,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65685 samples/s/p 2:12:23 } +2024-07-30 03:56:12,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 635/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 6.804171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:12,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65460 samples/s/p 2:12:23 } +2024-07-30 03:56:14,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 637/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.8009476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:14,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65932 samples/s/p 2:12:14 } +2024-07-30 03:56:17,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 639/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 6.7977244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:17,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.65855 samples/s/p 2:12:12 } +2024-07-30 03:56:20,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 641/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 6.7945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:20,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66106 samples/s/p 2:12:06 } +2024-07-30 03:56:23,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 643/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.7912756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:23,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66112 samples/s/p 2:12:03 } +2024-07-30 03:56:26,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 645/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 6.788049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:26,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.66005 samples/s/p 2:12:02 } +2024-07-30 03:56:29,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 647/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.7848214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:29,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.65962 samples/s/p 2:11:59 } +2024-07-30 03:56:31,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 649/ 3125], loss: 0.085, per_step_time: 1417ms, lr: 6.7815945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:31,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.64200 samples/s/p 2:12:21 } +2024-07-30 03:56:34,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 651/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 6.7783653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:34,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66076 samples/s/p 2:11:52 } +2024-07-30 03:56:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 653/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 6.7751357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:37,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.65934 samples/s/p 2:11:51 } +2024-07-30 03:56:40,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 655/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.7719066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66171 samples/s/p 2:11:45 } +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 657/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 6.768675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:43,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.66099 samples/s/p 2:11:43 } +2024-07-30 03:56:46,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 659/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 6.7654423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:46,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.66028 samples/s/p 2:11:42 } +2024-07-30 03:56:48,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 661/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.76221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65964 samples/s/p 2:11:40 } +2024-07-30 03:56:51,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 663/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 6.7589763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:51,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65997 samples/s/p 2:11:36 } +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 665/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 6.7557417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:54,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65982 samples/s/p 2:11:34 } +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 667/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 6.752506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:56:57,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.65972 samples/s/p 2:11:31 } +2024-07-30 03:57:00,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 669/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.7492706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:00,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66141 samples/s/p 2:11:26 } +2024-07-30 03:57:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 671/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.7460333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:03,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66111 samples/s/p 2:11:23 } +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 673/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.742795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:05,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.66001 samples/s/p 2:11:22 } +2024-07-30 03:57:08,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 675/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 6.7395567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:08,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.65848 samples/s/p 2:11:21 } +2024-07-30 03:57:11,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 677/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 6.736317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:11,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65804 samples/s/p 2:11:19 } +2024-07-30 03:57:14,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 679/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 6.733077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:14,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65432 samples/s/p 2:11:22 } +2024-07-30 03:57:17,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 681/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 6.7298356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:17,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65763 samples/s/p 2:11:14 } +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 683/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 6.7265933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:20,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.65707 samples/s/p 2:11:12 } +2024-07-30 03:57:22,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 685/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 6.723351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:22,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.66164 samples/s/p 2:11:03 } +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 687/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 6.7201063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:25,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65942 samples/s/p 2:11:03 } +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 689/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.7168626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:28,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65994 samples/s/p 2:11:00 } +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 691/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.7136175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:31,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.66146 samples/s/p 2:10:55 } +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 693/ 3125], loss: 0.261, per_step_time: 1414ms, lr: 6.710371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:34,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.65519 samples/s/p 2:11:01 } +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 695/ 3125], loss: 0.328, per_step_time: 1417ms, lr: 6.707124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:37,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.64542 samples/s/p 2:11:11 } +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 697/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.703876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:39,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65790 samples/s/p 2:10:51 } +2024-07-30 03:57:42,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 699/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 6.700628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:42,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65825 samples/s/p 2:10:48 } +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 701/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.6973794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:45,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.66040 samples/s/p 2:10:42 } +2024-07-30 03:57:48,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 703/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 6.6941284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:48,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.65711 samples/s/p 2:10:44 } +2024-07-30 03:57:51,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 705/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.690877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:51,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.65902 samples/s/p 2:10:38 } +2024-07-30 03:57:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 707/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.6876255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66149 samples/s/p 2:10:32 } +2024-07-30 03:57:56,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 709/ 3125], loss: 0.424, per_step_time: 1412ms, lr: 6.6843727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:56,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66184 samples/s/p 2:10:29 } +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 711/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 6.681119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:57:59,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66069 samples/s/p 2:10:28 } +2024-07-30 03:58:02,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 713/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.6778657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:02,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.66002 samples/s/p 2:10:26 } +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 715/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.67461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:05,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66321 samples/s/p 2:10:18 } +2024-07-30 03:58:08,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 717/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 6.671354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:08,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66269 samples/s/p 2:10:16 } +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 719/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 6.6680977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:11,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.66027 samples/s/p 2:10:17 } +2024-07-30 03:58:13,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 721/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.6648404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:13,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65912 samples/s/p 2:10:16 } +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 723/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 6.6615817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:16,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.65881 samples/s/p 2:10:13 } +2024-07-30 03:58:19,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 725/ 3125], loss: 0.420, per_step_time: 1416ms, lr: 6.6583234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:19,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.64971 samples/s/p 2:10:23 } +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 727/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.6550633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:22,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.65615 samples/s/p 2:10:11 } +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 729/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.6518032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:25,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66064 samples/s/p 2:10:02 } +2024-07-30 03:58:28,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 731/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 6.648541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:28,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.66232 samples/s/p 2:09:57 } +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 733/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 6.6452794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:30,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66119 samples/s/p 2:09:56 } +2024-07-30 03:58:33,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 735/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 6.6420166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:33,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.66085 samples/s/p 2:09:53 } +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 737/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 6.6387524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:36,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65588 samples/s/p 2:09:57 } +2024-07-30 03:58:39,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 739/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 6.6354874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65670 samples/s/p 2:09:53 } +2024-07-30 03:58:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 741/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 6.632223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.65820 samples/s/p 2:09:49 } +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 743/ 3125], loss: 0.356, per_step_time: 1413ms, lr: 6.6289567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:45,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65785 samples/s/p 2:09:46 } +2024-07-30 03:58:47,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 745/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 6.62569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:47,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.65996 samples/s/p 2:09:40 } +2024-07-30 03:58:50,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 747/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 6.622422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66097 samples/s/p 2:09:36 } +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 749/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 6.6191533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:53,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66042 samples/s/p 2:09:34 } +2024-07-30 03:58:56,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 751/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 6.6158846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.66029 samples/s/p 2:09:32 } +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 753/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 6.612614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:58:59,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66121 samples/s/p 2:09:27 } +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 755/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 6.6093444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:02,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66110 samples/s/p 2:09:25 } +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 757/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 6.6060725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66135 samples/s/p 2:09:22 } +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 759/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 6.6028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:07,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.66178 samples/s/p 2:09:18 } +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 761/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 6.599527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:10,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66166 samples/s/p 2:09:16 } +2024-07-30 03:59:13,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 763/ 3125], loss: 0.551, per_step_time: 1412ms, lr: 6.5962536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:13,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66172 samples/s/p 2:09:13 } +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 765/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 6.5929794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:16,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65963 samples/s/p 2:09:13 } +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 767/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 6.5897034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:19,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.66023 samples/s/p 2:09:09 } +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 769/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 6.5864274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:21,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.65794 samples/s/p 2:09:09 } +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 771/ 3125], loss: 0.358, per_step_time: 1415ms, lr: 6.5831505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:24,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65303 samples/s/p 2:09:13 } +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 773/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 6.5798736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:27,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65945 samples/s/p 2:09:02 } +2024-07-30 03:59:30,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 775/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 6.5765944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:30,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.66116 samples/s/p 2:08:56 } +2024-07-30 03:59:33,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 777/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 6.5733157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:33,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65894 samples/s/p 2:08:57 } +2024-07-30 03:59:36,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 779/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.570036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:36,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.65793 samples/s/p 2:08:55 } +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 781/ 3125], loss: 0.368, per_step_time: 1412ms, lr: 6.5667555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:38,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66201 samples/s/p 2:08:47 } +2024-07-30 03:59:41,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 783/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 6.5634736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:41,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.66087 samples/s/p 2:08:46 } +2024-07-30 03:59:44,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 785/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.560192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:44,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65860 samples/s/p 2:08:46 } +2024-07-30 03:59:47,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 787/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 6.556909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:47,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65552 samples/s/p 2:08:47 } +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 789/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 6.553625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:50,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.65847 samples/s/p 2:08:40 } +2024-07-30 03:59:53,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 791/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 6.550342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:53,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66128 samples/s/p 2:08:34 } +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 793/ 3125], loss: 0.298, per_step_time: 1414ms, lr: 6.5470563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65702 samples/s/p 2:08:37 } +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 795/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.5437703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 03:59:58,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.66112 samples/s/p 2:08:28 } +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 797/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 6.540484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:01,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.65963 samples/s/p 2:08:27 } +2024-07-30 04:00:04,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 799/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 6.5371964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:04,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66038 samples/s/p 2:08:24 } +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 801/ 3125], loss: 0.258, per_step_time: 1445ms, lr: 6.5339086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:07,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.53622 samples/s/p 2:11:13 } +2024-07-30 04:00:10,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 803/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 6.53062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:10,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.66129 samples/s/p 2:08:17 } +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 805/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 6.5273302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:13,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65837 samples/s/p 2:08:18 } +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 807/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.5240406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:15,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.65887 samples/s/p 2:08:14 } +2024-07-30 04:00:18,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 809/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 6.5207496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:18,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66156 samples/s/p 2:08:08 } +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 811/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 6.5174577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:21,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.66363 samples/s/p 2:08:02 } +2024-07-30 04:00:24,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 813/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 6.5141653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:24,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66004 samples/s/p 2:08:04 } +2024-07-30 04:00:27,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 815/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 6.510872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:27,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.66124 samples/s/p 2:08:00 } +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 817/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 6.507578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:30,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.65990 samples/s/p 2:07:59 } +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 819/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 6.504284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:32,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65940 samples/s/p 2:07:57 } +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 821/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 6.500989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:35,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66122 samples/s/p 2:07:51 } +2024-07-30 04:00:38,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 823/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 6.497693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:38,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.65875 samples/s/p 2:07:52 } +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 825/ 3125], loss: 0.179, per_step_time: 1412ms, lr: 6.494396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:41,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.66280 samples/s/p 2:07:44 } +2024-07-30 04:00:44,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 827/ 3125], loss: 0.490, per_step_time: 1413ms, lr: 6.4910982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:44,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66111 samples/s/p 2:07:43 } +2024-07-30 04:00:47,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 829/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 6.4878004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:47,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66157 samples/s/p 2:07:40 } +2024-07-30 04:00:49,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 831/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 6.4845017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:49,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.66135 samples/s/p 2:07:37 } +2024-07-30 04:00:52,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 833/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 6.481202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:52,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65966 samples/s/p 2:07:36 } +2024-07-30 04:00:55,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 835/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 6.4779024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:55,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.65968 samples/s/p 2:07:34 } +2024-07-30 04:00:58,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 837/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 6.474601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:00:58,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66054 samples/s/p 2:07:30 } +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 839/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 6.4712985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:01,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65419 samples/s/p 2:07:35 } +2024-07-30 04:01:04,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 841/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 6.4679966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:04,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66020 samples/s/p 2:07:24 } +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 843/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 6.464694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.65759 samples/s/p 2:07:25 } +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 845/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 6.4613905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:09,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.66162 samples/s/p 2:07:17 } +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 847/ 3125], loss: 0.428, per_step_time: 1414ms, lr: 6.4580854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:12,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65704 samples/s/p 2:07:20 } +2024-07-30 04:01:15,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 849/ 3125], loss: 0.190, per_step_time: 1414ms, lr: 6.4547808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:15,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65691 samples/s/p 2:07:18 } +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 851/ 3125], loss: 0.377, per_step_time: 1414ms, lr: 6.4514747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:18,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65619 samples/s/p 2:07:16 } +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 853/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 6.448168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.65392 samples/s/p 2:07:16 } +2024-07-30 04:01:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 855/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 6.4448614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:23,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66038 samples/s/p 2:07:04 } +2024-07-30 04:01:26,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 857/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 6.4415535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:26,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66101 samples/s/p 2:07:01 } +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 859/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 6.4382443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:29,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.65929 samples/s/p 2:07:00 } +2024-07-30 04:01:32,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 861/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 6.434935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:32,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66103 samples/s/p 2:06:55 } +2024-07-30 04:01:35,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 863/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 6.4316255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:35,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.66163 samples/s/p 2:06:51 } +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 865/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.428315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:38,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65864 samples/s/p 2:06:53 } +2024-07-30 04:01:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 867/ 3125], loss: 0.485, per_step_time: 1414ms, lr: 6.425004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:40,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65714 samples/s/p 2:06:52 } +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 869/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.4216915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65825 samples/s/p 2:06:48 } +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 871/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 6.4183782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.66187 samples/s/p 2:06:40 } +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 873/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 6.4150654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:49,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.65692 samples/s/p 2:06:44 } +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 875/ 3125], loss: 0.493, per_step_time: 1413ms, lr: 6.411751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:52,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66025 samples/s/p 2:06:36 } +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 877/ 3125], loss: 0.635, per_step_time: 1413ms, lr: 6.408436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:55,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66078 samples/s/p 2:06:33 } +2024-07-30 04:01:57,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 879/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 6.4051214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:01:57,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66096 samples/s/p 2:06:30 } +2024-07-30 04:02:00,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 881/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.401805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:00,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.66055 samples/s/p 2:06:27 } +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 883/ 3125], loss: 0.295, per_step_time: 1425ms, lr: 6.398488e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:03,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.61103 samples/s/p 2:07:32 } +2024-07-30 04:02:06,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 885/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 6.3951707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:06,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.66109 samples/s/p 2:06:21 } +2024-07-30 04:02:09,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 887/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 6.391853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:09,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65869 samples/s/p 2:06:21 } +2024-07-30 04:02:12,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 889/ 3125], loss: 0.163, per_step_time: 1417ms, lr: 6.388534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:12,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.64497 samples/s/p 2:06:37 } +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 891/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 6.385215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:14,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.65901 samples/s/p 2:06:15 } +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 893/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 6.3818943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:17,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66016 samples/s/p 2:06:11 } +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 895/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 6.378574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:20,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66131 samples/s/p 2:06:07 } +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 897/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 6.3752523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:23,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66165 samples/s/p 2:06:03 } +2024-07-30 04:02:26,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 899/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.371931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:26,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.65882 samples/s/p 2:06:04 } +2024-07-30 04:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 901/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.3686084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:29,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.66097 samples/s/p 2:05:59 } +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 903/ 3125], loss: 0.049, per_step_time: 1413ms, lr: 6.3652847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:31,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66102 samples/s/p 2:05:56 } +2024-07-30 04:02:34,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 905/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 6.36196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:34,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66105 samples/s/p 2:05:53 } +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 907/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 6.358636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:37,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.66083 samples/s/p 2:05:50 } +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 909/ 3125], loss: 0.149, per_step_time: 1426ms, lr: 6.3553107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:40,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.61008 samples/s/p 2:06:56 } +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 911/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 6.3519847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:43,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66151 samples/s/p 2:05:44 } +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 913/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 6.3486586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:46,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66073 samples/s/p 2:05:42 } +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 915/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 6.345331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:48,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.66179 samples/s/p 2:05:38 } +2024-07-30 04:02:51,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 917/ 3125], loss: 0.467, per_step_time: 1413ms, lr: 6.342003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65839 samples/s/p 2:05:39 } +2024-07-30 04:02:54,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 919/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.338674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:54,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.65801 samples/s/p 2:05:37 } +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 921/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 6.3353455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:02:57,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66221 samples/s/p 2:05:29 } +2024-07-30 04:03:00,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 923/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.332016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:00,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.66094 samples/s/p 2:05:28 } +2024-07-30 04:03:03,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 925/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 6.3286852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:03,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65954 samples/s/p 2:05:27 } +2024-07-30 04:03:05,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 927/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 6.3253538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:05,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65957 samples/s/p 2:05:24 } +2024-07-30 04:03:08,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 929/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 6.3220227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:08,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.65669 samples/s/p 2:05:25 } +2024-07-30 04:03:11,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 931/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 6.318691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:11,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65744 samples/s/p 2:05:21 } +2024-07-30 04:03:14,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 933/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 6.315357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:14,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65826 samples/s/p 2:05:17 } +2024-07-30 04:03:17,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 935/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 6.3120237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:17,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65573 samples/s/p 2:05:18 } +2024-07-30 04:03:20,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 937/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 6.308689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:20,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.65918 samples/s/p 2:05:10 } +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 939/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 6.305355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:22,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.66268 samples/s/p 2:05:03 } +2024-07-30 04:03:25,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 941/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 6.3020193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:25,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.66272 samples/s/p 2:05:00 } +2024-07-30 04:03:28,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 943/ 3125], loss: 0.153, per_step_time: 1419ms, lr: 6.2986833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:28,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.63516 samples/s/p 2:05:34 } +2024-07-30 04:03:31,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 945/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.2953472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:31,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.65775 samples/s/p 2:05:01 } +2024-07-30 04:03:34,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 947/ 3125], loss: 0.170, per_step_time: 1418ms, lr: 6.2920094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:34,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.64118 samples/s/p 2:05:20 } +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 949/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 6.2886706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:37,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66040 samples/s/p 2:04:52 } +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 951/ 3125], loss: 0.128, per_step_time: 1412ms, lr: 6.2853323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:39,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66206 samples/s/p 2:04:47 } +2024-07-30 04:03:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 953/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 6.281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65804 samples/s/p 2:04:49 } +2024-07-30 04:03:45,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 955/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 6.2786535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:45,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.66209 samples/s/p 2:04:41 } +2024-07-30 04:03:48,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 957/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 6.2753134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:48,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.65760 samples/s/p 2:04:44 } +2024-07-30 04:03:51,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 959/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 6.2719723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:51,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65622 samples/s/p 2:04:43 } +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 961/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.2686304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:54,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66158 samples/s/p 2:04:33 } +2024-07-30 04:03:56,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 963/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 6.2652884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:56,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66090 samples/s/p 2:04:31 } +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 965/ 3125], loss: 0.207, per_step_time: 1412ms, lr: 6.2619456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:03:59,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.66173 samples/s/p 2:04:27 } +2024-07-30 04:04:02,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 967/ 3125], loss: 0.455, per_step_time: 1413ms, lr: 6.2586028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:02,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.65934 samples/s/p 2:04:28 } +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 969/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 6.255258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:05,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66009 samples/s/p 2:04:24 } +2024-07-30 04:04:08,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 971/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 6.2519143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66024 samples/s/p 2:04:21 } +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 973/ 3125], loss: 0.444, per_step_time: 1414ms, lr: 6.2485683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:11,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.65642 samples/s/p 2:04:23 } +2024-07-30 04:04:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 975/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 6.245223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:13,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.66088 samples/s/p 2:04:14 } +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 977/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 6.2418762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:16,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66151 samples/s/p 2:04:11 } +2024-07-30 04:04:19,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 979/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 6.2385297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:19,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.66039 samples/s/p 2:04:09 } +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 981/ 3125], loss: 0.238, per_step_time: 1414ms, lr: 6.2351824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:22,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65631 samples/s/p 2:04:12 } +2024-07-30 04:04:25,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 983/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.2318336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:25,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65898 samples/s/p 2:04:05 } +2024-07-30 04:04:28,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 985/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 6.228485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:28,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.65492 samples/s/p 2:04:08 } +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 987/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 6.2251356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:30,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65732 samples/s/p 2:04:02 } +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 989/ 3125], loss: 0.135, per_step_time: 1418ms, lr: 6.221786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:33,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.63943 samples/s/p 2:04:23 } +2024-07-30 04:04:36,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 991/ 3125], loss: 0.239, per_step_time: 1412ms, lr: 6.218435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:36,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.66231 samples/s/p 2:03:50 } +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 993/ 3125], loss: 0.431, per_step_time: 1415ms, lr: 6.215085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:39,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.65088 samples/s/p 2:04:02 } +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 995/ 3125], loss: 0.215, per_step_time: 1417ms, lr: 6.2117324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:42,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.64343 samples/s/p 2:04:09 } +2024-07-30 04:04:45,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 997/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 6.2083805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:45,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.66052 samples/s/p 2:03:44 } +2024-07-30 04:04:48,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 999/ 3125], loss: 0.067, per_step_time: 1413ms, lr: 6.205027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:48,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.66016 samples/s/p 2:03:41 } +2024-07-30 04:04:50,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1001/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 6.2016743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:50,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65942 samples/s/p 2:03:39 } +2024-07-30 04:04:53,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1003/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 6.19832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.65759 samples/s/p 2:03:39 } +2024-07-30 04:04:56,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1005/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 6.194966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:56,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66189 samples/s/p 2:03:30 } +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1007/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 6.19161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:04:59,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65872 samples/s/p 2:03:32 } +2024-07-30 04:05:02,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 6.1882547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:02,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.66046 samples/s/p 2:03:27 } +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1011/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 6.1848987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65852 samples/s/p 2:03:26 } +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1013/ 3125], loss: 0.426, per_step_time: 1415ms, lr: 6.1815417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:07,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.65144 samples/s/p 2:03:33 } +2024-07-30 04:05:10,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1015/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 6.178185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:10,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66056 samples/s/p 2:03:18 } +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1017/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 6.174826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:13,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65821 samples/s/p 2:03:18 } +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1019/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.1714672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:16,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65781 samples/s/p 2:03:16 } +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1021/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 6.1681085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:19,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.65969 samples/s/p 2:03:11 } +2024-07-30 04:05:22,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1023/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 6.1647493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:22,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.66057 samples/s/p 2:03:07 } +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1025/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.161389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:24,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65387 samples/s/p 2:03:13 } +2024-07-30 04:05:27,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1027/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 6.158028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:27,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65663 samples/s/p 2:03:06 } +2024-07-30 04:05:30,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1029/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 6.1546666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65872 samples/s/p 2:03:01 } +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1031/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 6.1513047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.65917 samples/s/p 2:02:57 } +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1033/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 6.147943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:36,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.65954 samples/s/p 2:02:54 } +2024-07-30 04:05:39,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1035/ 3125], loss: 0.040, per_step_time: 1412ms, lr: 6.1445794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:39,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66237 samples/s/p 2:02:47 } +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1037/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 6.1412165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:41,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66007 samples/s/p 2:02:48 } +2024-07-30 04:05:44,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1039/ 3125], loss: 0.218, per_step_time: 1412ms, lr: 6.137852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66233 samples/s/p 2:02:42 } +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1041/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.134487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:47,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.66137 samples/s/p 2:02:40 } +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1043/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 6.131122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:50,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66040 samples/s/p 2:02:39 } +2024-07-30 04:05:53,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1045/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 6.1277565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.66188 samples/s/p 2:02:34 } +2024-07-30 04:05:56,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1047/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 6.124391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:56,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65980 samples/s/p 2:02:34 } +2024-07-30 04:05:58,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1049/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 6.121024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:05:58,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65713 samples/s/p 2:02:34 } +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1051/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.117656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:01,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.65856 samples/s/p 2:02:30 } +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1053/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 6.114288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:04,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.65767 samples/s/p 2:02:28 } +2024-07-30 04:06:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1055/ 3125], loss: 0.335, per_step_time: 1412ms, lr: 6.1109204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:07,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66183 samples/s/p 2:02:20 } +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1057/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 6.107551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66043 samples/s/p 2:02:19 } +2024-07-30 04:06:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1059/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 6.1041824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.66295 samples/s/p 2:02:13 } +2024-07-30 04:06:15,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1061/ 3125], loss: 0.301, per_step_time: 1412ms, lr: 6.100812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:15,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66219 samples/s/p 2:02:11 } +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1063/ 3125], loss: 0.454, per_step_time: 1412ms, lr: 6.097441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:18,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66181 samples/s/p 2:02:09 } +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1065/ 3125], loss: 0.363, per_step_time: 1413ms, lr: 6.0940706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:21,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.66111 samples/s/p 2:02:07 } +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1067/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 6.090699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:24,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65983 samples/s/p 2:02:06 } +2024-07-30 04:06:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1069/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 6.0873276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.65980 samples/s/p 2:02:03 } +2024-07-30 04:06:30,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1071/ 3125], loss: 0.271, per_step_time: 1412ms, lr: 6.083955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:30,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.66204 samples/s/p 2:01:57 } +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1073/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 6.0805814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65979 samples/s/p 2:01:57 } +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1075/ 3125], loss: 0.729, per_step_time: 1413ms, lr: 6.0772086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:06:35,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65828 samples/s/p 2:01:56 } +2024-07-30 04:06:35,720 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:07:10,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1077/ 3125], loss: 0.403, per_step_time: 1494ms, lr: 6.0738334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:10,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.35329 samples/s/p 2:08:50 } +2024-07-30 04:07:13,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1079/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 6.070459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:13,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.65931 samples/s/p 2:01:49 } +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1081/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 6.0670845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:16,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65986 samples/s/p 2:01:46 } +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1083/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 6.0637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65801 samples/s/p 2:01:45 } +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1085/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.060332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:21,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65938 samples/s/p 2:01:41 } +2024-07-30 04:07:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1087/ 3125], loss: 0.442, per_step_time: 1414ms, lr: 6.056956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65755 samples/s/p 2:01:40 } +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1089/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 6.0535785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:27,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.65875 samples/s/p 2:01:36 } +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1091/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.0502007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65911 samples/s/p 2:01:33 } +2024-07-30 04:07:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1093/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 6.0468233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:33,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.66099 samples/s/p 2:01:27 } +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1095/ 3125], loss: 0.273, per_step_time: 1415ms, lr: 6.043444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:35,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.65039 samples/s/p 2:01:38 } +2024-07-30 04:07:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1097/ 3125], loss: 0.269, per_step_time: 1417ms, lr: 6.0400653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.64529 samples/s/p 2:01:42 } +2024-07-30 04:07:41,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1099/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 6.0366856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:41,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66165 samples/s/p 2:01:18 } +2024-07-30 04:07:44,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1101/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.0333055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:44,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65991 samples/s/p 2:01:17 } +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1103/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 6.0299253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:47,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.66099 samples/s/p 2:01:13 } +2024-07-30 04:07:50,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1105/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.026544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:50,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65991 samples/s/p 2:01:12 } +2024-07-30 04:07:52,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1107/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 6.023162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:52,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.65762 samples/s/p 2:01:12 } +2024-07-30 04:07:55,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1109/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 6.01978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:55,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66154 samples/s/p 2:01:04 } +2024-07-30 04:07:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1111/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 6.016398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:07:58,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66017 samples/s/p 2:01:03 } +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1113/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 6.013014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:01,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65830 samples/s/p 2:01:02 } +2024-07-30 04:08:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1115/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 6.009631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:04,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.65966 samples/s/p 2:00:58 } +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1117/ 3125], loss: 0.078, per_step_time: 1413ms, lr: 6.0062466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:07,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.66092 samples/s/p 2:00:53 } +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1119/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 6.0028624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:09,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65521 samples/s/p 2:00:58 } +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1121/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 5.9994773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:12,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66002 samples/s/p 2:00:49 } +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1123/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.9960917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:15,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.66070 samples/s/p 2:00:45 } +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1125/ 3125], loss: 0.346, per_step_time: 1415ms, lr: 5.992706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.65319 samples/s/p 2:00:52 } +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1127/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 5.9893196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:21,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65785 samples/s/p 2:00:43 } +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1129/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 5.985932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:24,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65717 samples/s/p 2:00:41 } +2024-07-30 04:08:26,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1131/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.9825456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:26,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66008 samples/s/p 2:00:35 } +2024-07-30 04:08:29,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1133/ 3125], loss: 0.263, per_step_time: 1415ms, lr: 5.9791573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:29,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.65345 samples/s/p 2:00:40 } +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1135/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 5.975769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:32,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.66074 samples/s/p 2:00:28 } +2024-07-30 04:08:35,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1137/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.9723807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:35,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66049 samples/s/p 2:00:26 } +2024-07-30 04:08:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1139/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 5.968991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66192 samples/s/p 2:00:21 } +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1141/ 3125], loss: 0.280, per_step_time: 1412ms, lr: 5.9656018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:41,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66246 samples/s/p 2:00:18 } +2024-07-30 04:08:43,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1143/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 5.962211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:43,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66005 samples/s/p 2:00:18 } +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1145/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 5.958821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:46,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.66124 samples/s/p 2:00:13 } +2024-07-30 04:08:49,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1147/ 3125], loss: 0.402, per_step_time: 1416ms, lr: 5.95543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.64876 samples/s/p 2:00:27 } +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1149/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 5.952038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:52,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66011 samples/s/p 2:00:09 } +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1151/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 5.948646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:55,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.65901 samples/s/p 2:00:08 } +2024-07-30 04:08:58,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1153/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.9452536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:08:58,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.66042 samples/s/p 2:00:03 } +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1155/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.941861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:00,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66089 samples/s/p 2:00:00 } +2024-07-30 04:09:03,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1157/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.9384674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:03,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.66094 samples/s/p 1:59:57 } +2024-07-30 04:09:06,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1159/ 3125], loss: 0.184, per_step_time: 1414ms, lr: 5.935074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:06,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65760 samples/s/p 1:59:58 } +2024-07-30 04:09:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1161/ 3125], loss: 0.220, per_step_time: 1415ms, lr: 5.9316794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65318 samples/s/p 2:00:01 } +2024-07-30 04:09:12,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1163/ 3125], loss: 0.257, per_step_time: 1414ms, lr: 5.9282843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:12,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.65560 samples/s/p 1:59:55 } +2024-07-30 04:09:15,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1165/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.92489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:15,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.66039 samples/s/p 1:59:46 } +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1167/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 5.921494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:17,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65864 samples/s/p 1:59:46 } +2024-07-30 04:09:20,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1169/ 3125], loss: 0.143, per_step_time: 1415ms, lr: 5.9180984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:20,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65340 samples/s/p 1:59:50 } +2024-07-30 04:09:23,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1171/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.914702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:23,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.66152 samples/s/p 1:59:36 } +2024-07-30 04:09:26,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1173/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 5.911305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:26,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.65607 samples/s/p 1:59:40 } +2024-07-30 04:09:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1175/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9079075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66056 samples/s/p 1:59:32 } +2024-07-30 04:09:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1177/ 3125], loss: 0.103, per_step_time: 1414ms, lr: 5.90451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.65669 samples/s/p 1:59:34 } +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1179/ 3125], loss: 0.161, per_step_time: 1412ms, lr: 5.9011118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66172 samples/s/p 1:59:25 } +2024-07-30 04:09:37,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1181/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 5.897713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:37,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.66055 samples/s/p 1:59:23 } +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1183/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 5.8943137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:40,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65327 samples/s/p 1:59:30 } +2024-07-30 04:09:43,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1185/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.890914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:43,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65603 samples/s/p 1:59:24 } +2024-07-30 04:09:46,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1187/ 3125], loss: 0.055, per_step_time: 1414ms, lr: 5.887515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:46,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.65528 samples/s/p 1:59:22 } +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1189/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 5.884114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:49,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65457 samples/s/p 1:59:20 } +2024-07-30 04:09:51,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1191/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 5.880714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.65694 samples/s/p 1:59:14 } +2024-07-30 04:09:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1193/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.877312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.65887 samples/s/p 1:59:09 } +2024-07-30 04:09:57,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1195/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 5.8739106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:09:57,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66156 samples/s/p 1:59:02 } +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1197/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 5.870509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:00,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66244 samples/s/p 1:58:58 } +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1199/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 5.867106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:03,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66129 samples/s/p 1:58:57 } +2024-07-30 04:10:06,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1201/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 5.863704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:06,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.66094 samples/s/p 1:58:55 } +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1203/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.8603005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:08,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66006 samples/s/p 1:58:53 } +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1205/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 5.8568967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:11,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66153 samples/s/p 1:58:48 } +2024-07-30 04:10:14,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1207/ 3125], loss: 0.055, per_step_time: 1440ms, lr: 5.8534924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:14,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.55214 samples/s/p 2:01:06 } +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1209/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.8500887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.66046 samples/s/p 1:58:44 } +2024-07-30 04:10:20,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1211/ 3125], loss: 0.261, per_step_time: 1412ms, lr: 5.846684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66174 samples/s/p 1:58:40 } +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1213/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.843279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:23,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65861 samples/s/p 1:58:41 } +2024-07-30 04:10:26,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1215/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.8398728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66017 samples/s/p 1:58:36 } +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1217/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.8364662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:28,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.65873 samples/s/p 1:58:35 } +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1219/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 5.83306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:31,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.66159 samples/s/p 1:58:28 } +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1221/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.829653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:34,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65980 samples/s/p 1:58:28 } +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1223/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 5.826246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:37,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65961 samples/s/p 1:58:25 } +2024-07-30 04:10:40,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1225/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 5.8228384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:40,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.66103 samples/s/p 1:58:21 } +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1227/ 3125], loss: 0.120, per_step_time: 1413ms, lr: 5.81943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:43,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65822 samples/s/p 1:58:21 } +2024-07-30 04:10:45,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1229/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 5.8160213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:45,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.65512 samples/s/p 1:58:22 } +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1231/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 5.8126125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:48,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65995 samples/s/p 1:58:14 } +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1233/ 3125], loss: 0.504, per_step_time: 1414ms, lr: 5.8092037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:51,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65631 samples/s/p 1:58:15 } +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1235/ 3125], loss: 0.378, per_step_time: 1415ms, lr: 5.805794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:54,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65013 samples/s/p 1:58:20 } +2024-07-30 04:10:57,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1237/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 5.8023843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:10:57,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.65441 samples/s/p 1:58:12 } +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1239/ 3125], loss: 0.475, per_step_time: 1413ms, lr: 5.7989732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:00,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.66041 samples/s/p 1:58:02 } +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1241/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 5.7955635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:02,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66085 samples/s/p 1:57:58 } +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1243/ 3125], loss: 0.288, per_step_time: 1412ms, lr: 5.7921516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:05,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66200 samples/s/p 1:57:54 } +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1245/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 5.7887405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:08,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66093 samples/s/p 1:57:53 } +2024-07-30 04:11:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1247/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 5.7853285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.66089 samples/s/p 1:57:50 } +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1249/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 5.781916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:14,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66087 samples/s/p 1:57:47 } +2024-07-30 04:11:17,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1251/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 5.7785032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:17,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66186 samples/s/p 1:57:43 } +2024-07-30 04:11:19,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1253/ 3125], loss: 0.485, per_step_time: 1415ms, lr: 5.7750904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:19,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65285 samples/s/p 1:57:51 } +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1255/ 3125], loss: 0.230, per_step_time: 1412ms, lr: 5.7716775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:22,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.66214 samples/s/p 1:57:37 } +2024-07-30 04:11:25,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1257/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 5.7682632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:25,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.65890 samples/s/p 1:57:38 } +2024-07-30 04:11:28,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1259/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 5.7648494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:28,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65442 samples/s/p 1:57:41 } +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1261/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 5.7614347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:31,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65852 samples/s/p 1:57:33 } +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1263/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.75802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:34,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65992 samples/s/p 1:57:28 } +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1265/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 5.754605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.66232 samples/s/p 1:57:23 } +2024-07-30 04:11:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1267/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.7511893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.65845 samples/s/p 1:57:25 } +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1269/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.7477737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:42,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65877 samples/s/p 1:57:21 } +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1271/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.7443576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:45,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.65552 samples/s/p 1:57:23 } +2024-07-30 04:11:48,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1273/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.7409397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:48,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66037 samples/s/p 1:57:14 } +2024-07-30 04:11:51,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1275/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 5.737523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:51,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.66137 samples/s/p 1:57:10 } +2024-07-30 04:11:53,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1277/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 5.7341063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:53,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65893 samples/s/p 1:57:10 } +2024-07-30 04:11:56,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1279/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.7306884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:56,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65939 samples/s/p 1:57:06 } +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1281/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.7272705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:11:59,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65548 samples/s/p 1:57:08 } +2024-07-30 04:12:02,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1283/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 5.723852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:02,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.65912 samples/s/p 1:57:01 } +2024-07-30 04:12:05,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1285/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.7204334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:05,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.66096 samples/s/p 1:56:56 } +2024-07-30 04:12:08,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1287/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 5.717014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:08,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65563 samples/s/p 1:57:00 } +2024-07-30 04:12:10,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1289/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 5.713595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:10,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65439 samples/s/p 1:56:58 } +2024-07-30 04:12:13,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1291/ 3125], loss: 0.583, per_step_time: 1412ms, lr: 5.7101756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:13,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66230 samples/s/p 1:56:46 } +2024-07-30 04:12:16,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1293/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 5.7067546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:16,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.65787 samples/s/p 1:56:48 } +2024-07-30 04:12:19,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1295/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 5.703335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:19,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.66144 samples/s/p 1:56:41 } +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1297/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 5.6999133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:22,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66065 samples/s/p 1:56:39 } +2024-07-30 04:12:25,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1299/ 3125], loss: 0.402, per_step_time: 1412ms, lr: 5.6964927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:25,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66210 samples/s/p 1:56:35 } +2024-07-30 04:12:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1301/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 5.6930708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:27,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.66105 samples/s/p 1:56:33 } +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1303/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 5.6896492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:30,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.65411 samples/s/p 1:56:39 } +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1305/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 5.6862277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:33,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65846 samples/s/p 1:56:31 } +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1307/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.682805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:36,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.65943 samples/s/p 1:56:27 } +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1309/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 5.679382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:39,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66159 samples/s/p 1:56:21 } +2024-07-30 04:12:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1311/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.675959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66060 samples/s/p 1:56:20 } +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1313/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 5.6725357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:44,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.66032 samples/s/p 1:56:17 } +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1315/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 5.669112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:47,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66093 samples/s/p 1:56:14 } +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1317/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.665688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.66126 samples/s/p 1:56:10 } +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1319/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.6622634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:53,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65955 samples/s/p 1:56:10 } +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1321/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 5.658839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:56,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65984 samples/s/p 1:56:06 } +2024-07-30 04:12:59,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1323/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 5.6554136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:12:59,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.65870 samples/s/p 1:56:05 } +2024-07-30 04:13:01,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1325/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 5.651989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:01,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65795 samples/s/p 1:56:03 } +2024-07-30 04:13:04,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1327/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 5.6485633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:04,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65951 samples/s/p 1:55:58 } +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1329/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.645137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.66007 samples/s/p 1:55:55 } +2024-07-30 04:13:10,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1331/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 5.6417107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:10,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.65029 samples/s/p 1:56:04 } +2024-07-30 04:13:13,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1333/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 5.6382846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:13,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65504 samples/s/p 1:55:55 } +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1335/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.6348576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:16,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65898 samples/s/p 1:55:48 } +2024-07-30 04:13:18,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1337/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.63143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:18,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.65882 samples/s/p 1:55:45 } +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1339/ 3125], loss: 0.309, per_step_time: 1412ms, lr: 5.6280032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:21,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66261 samples/s/p 1:55:38 } +2024-07-30 04:13:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1341/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 5.624575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.66037 samples/s/p 1:55:38 } +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1343/ 3125], loss: 0.159, per_step_time: 1414ms, lr: 5.621147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:27,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65733 samples/s/p 1:55:38 } +2024-07-30 04:13:30,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1345/ 3125], loss: 0.167, per_step_time: 1414ms, lr: 5.6177187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:30,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65731 samples/s/p 1:55:36 } +2024-07-30 04:13:33,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1347/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 5.61429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:33,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65611 samples/s/p 1:55:34 } +2024-07-30 04:13:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1349/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 5.6108615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:35,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65744 samples/s/p 1:55:30 } +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1351/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 5.607432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.65897 samples/s/p 1:55:25 } +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1353/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.604002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65884 samples/s/p 1:55:22 } +2024-07-30 04:13:44,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1355/ 3125], loss: 0.400, per_step_time: 1412ms, lr: 5.600573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.66257 samples/s/p 1:55:15 } +2024-07-30 04:13:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1357/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.597143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65940 samples/s/p 1:55:16 } +2024-07-30 04:13:50,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1359/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 5.593712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:50,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.65379 samples/s/p 1:55:20 } +2024-07-30 04:13:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1361/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.590282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66108 samples/s/p 1:55:08 } +2024-07-30 04:13:55,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1363/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 5.5868504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:55,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.65581 samples/s/p 1:55:12 } +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1365/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 5.583419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:13:58,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66123 samples/s/p 1:55:03 } +2024-07-30 04:14:01,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1367/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.579988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:01,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66082 samples/s/p 1:55:00 } +2024-07-30 04:14:04,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1369/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 5.5765563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.66052 samples/s/p 1:54:58 } +2024-07-30 04:14:07,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1371/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 5.5731243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:07,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.66169 samples/s/p 1:54:54 } +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1373/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 5.5696914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.66034 samples/s/p 1:54:52 } +2024-07-30 04:14:12,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1375/ 3125], loss: 0.419, per_step_time: 1412ms, lr: 5.566259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66191 samples/s/p 1:54:48 } +2024-07-30 04:14:15,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1377/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 5.562826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:15,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.65966 samples/s/p 1:54:48 } +2024-07-30 04:14:18,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1379/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 5.5593937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:18,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.66120 samples/s/p 1:54:43 } +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1381/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.55596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:21,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65836 samples/s/p 1:54:43 } +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1383/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.5525265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65829 samples/s/p 1:54:41 } +2024-07-30 04:14:26,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1385/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.5490923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:26,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65821 samples/s/p 1:54:38 } +2024-07-30 04:14:29,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1387/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 5.5456576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:29,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.65963 samples/s/p 1:54:33 } +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1389/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.5422233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.66052 samples/s/p 1:54:30 } +2024-07-30 04:14:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1391/ 3125], loss: 0.410, per_step_time: 1414ms, lr: 5.538789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:35,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65760 samples/s/p 1:54:30 } +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1393/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 5.5353544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:38,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65717 samples/s/p 1:54:28 } +2024-07-30 04:14:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1395/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.5319188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65962 samples/s/p 1:54:22 } +2024-07-30 04:14:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1397/ 3125], loss: 0.091, per_step_time: 1414ms, lr: 5.5284827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.65720 samples/s/p 1:54:22 } +2024-07-30 04:14:46,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1399/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.5250475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:46,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65827 samples/s/p 1:54:18 } +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1401/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.521611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:49,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65818 samples/s/p 1:54:15 } +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1403/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.5181754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:52,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.66003 samples/s/p 1:54:10 } +2024-07-30 04:14:55,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1405/ 3125], loss: 0.088, per_step_time: 1413ms, lr: 5.514739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:55,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65992 samples/s/p 1:54:08 } +2024-07-30 04:14:58,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1407/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.5113014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:14:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.65725 samples/s/p 1:54:08 } +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1409/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 5.507865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65865 samples/s/p 1:54:04 } +2024-07-30 04:15:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1411/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.5044275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66041 samples/s/p 1:53:59 } +2024-07-30 04:15:06,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1413/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 5.5009905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:06,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66110 samples/s/p 1:53:55 } +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1415/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 5.497553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.65684 samples/s/p 1:53:57 } +2024-07-30 04:15:12,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1417/ 3125], loss: 0.527, per_step_time: 1413ms, lr: 5.4941147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:12,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.66018 samples/s/p 1:53:50 } +2024-07-30 04:15:15,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1419/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 5.490676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:15,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.66167 samples/s/p 1:53:46 } +2024-07-30 04:15:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1421/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 5.487238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65927 samples/s/p 1:53:46 } +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1423/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 5.483799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:20,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65717 samples/s/p 1:53:46 } +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1425/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 5.480361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.65924 samples/s/p 1:53:40 } +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1427/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.4769216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:26,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65894 samples/s/p 1:53:38 } +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1429/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 5.4734824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:29,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.65810 samples/s/p 1:53:36 } +2024-07-30 04:15:32,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1431/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 5.470042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:32,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66146 samples/s/p 1:53:29 } +2024-07-30 04:15:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1433/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 5.466603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:34,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66136 samples/s/p 1:53:26 } +2024-07-30 04:15:37,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1435/ 3125], loss: 0.118, per_step_time: 1412ms, lr: 5.4631632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:37,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.66186 samples/s/p 1:53:23 } +2024-07-30 04:15:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1437/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 5.4597226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66172 samples/s/p 1:53:20 } +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1439/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 5.4562825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:43,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66182 samples/s/p 1:53:17 } +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1441/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4528414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:46,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.66170 samples/s/p 1:53:15 } +2024-07-30 04:15:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1443/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 5.449401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65843 samples/s/p 1:53:16 } +2024-07-30 04:15:51,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1445/ 3125], loss: 0.317, per_step_time: 1415ms, lr: 5.4459592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:51,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.65171 samples/s/p 1:53:21 } +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1447/ 3125], loss: 0.117, per_step_time: 1414ms, lr: 5.4425186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:54,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65631 samples/s/p 1:53:13 } +2024-07-30 04:15:57,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1449/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4390775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:15:57,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65921 samples/s/p 1:53:06 } +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1451/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.435635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:00,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.66082 samples/s/p 1:53:02 } +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1453/ 3125], loss: 0.465, per_step_time: 1415ms, lr: 5.432193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:03,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.65159 samples/s/p 1:53:10 } +2024-07-30 04:16:06,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1455/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.428751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:06,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66078 samples/s/p 1:52:56 } +2024-07-30 04:16:09,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1457/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 5.4253087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:09,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65666 samples/s/p 1:52:58 } +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1459/ 3125], loss: 0.303, per_step_time: 1412ms, lr: 5.4218663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:11,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66188 samples/s/p 1:52:49 } +2024-07-30 04:16:14,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1461/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 5.418424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:14,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.66087 samples/s/p 1:52:47 } +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1463/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.4149805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:17,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.65826 samples/s/p 1:52:48 } +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1465/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 5.4115376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:20,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66173 samples/s/p 1:52:41 } +2024-07-30 04:16:23,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1467/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.408094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:23,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.66104 samples/s/p 1:52:39 } +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1469/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 5.4046504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:26,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65628 samples/s/p 1:52:42 } +2024-07-30 04:16:28,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1471/ 3125], loss: 0.181, per_step_time: 1414ms, lr: 5.401207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:28,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65531 samples/s/p 1:52:40 } +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1473/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 5.3977633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:31,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.65875 samples/s/p 1:52:33 } +2024-07-30 04:16:34,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1475/ 3125], loss: 0.199, per_step_time: 1412ms, lr: 5.3943186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:34,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.66247 samples/s/p 1:52:26 } +2024-07-30 04:16:37,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1477/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 5.390875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:37,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65999 samples/s/p 1:52:26 } +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1479/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.38743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65842 samples/s/p 1:52:25 } +2024-07-30 04:16:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1481/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.3839854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:43,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.65893 samples/s/p 1:52:21 } +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1483/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 5.380541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:45,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65815 samples/s/p 1:52:20 } +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1485/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 5.377095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:48,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.65788 samples/s/p 1:52:17 } +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1487/ 3125], loss: 0.394, per_step_time: 1413ms, lr: 5.3736508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:51,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66121 samples/s/p 1:52:10 } +2024-07-30 04:16:54,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1489/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.3702047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:54,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66081 samples/s/p 1:52:08 } +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1491/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 5.366759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:16:57,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.66266 samples/s/p 1:52:03 } +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1493/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 5.363314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:00,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65954 samples/s/p 1:52:04 } +2024-07-30 04:17:02,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1495/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.359868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:02,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65983 samples/s/p 1:52:01 } +2024-07-30 04:17:05,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1497/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.3564213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:05,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65968 samples/s/p 1:51:58 } +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1499/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.3529757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:08,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.65976 samples/s/p 1:51:55 } +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1501/ 3125], loss: 0.433, per_step_time: 1412ms, lr: 5.349529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:11,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.66218 samples/s/p 1:51:49 } +2024-07-30 04:17:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1503/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 5.346082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:14,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66077 samples/s/p 1:51:48 } +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1505/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.342636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:17,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.66011 samples/s/p 1:51:46 } +2024-07-30 04:17:19,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1507/ 3125], loss: 0.189, per_step_time: 1415ms, lr: 5.3391886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:19,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65036 samples/s/p 1:51:55 } +2024-07-30 04:17:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1509/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 5.3357408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.65616 samples/s/p 1:51:45 } +2024-07-30 04:17:25,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1511/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.3322938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:25,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.66110 samples/s/p 1:51:36 } +2024-07-30 04:17:28,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1513/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 5.3288472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:28,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65699 samples/s/p 1:51:38 } +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1515/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.3253993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:31,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65873 samples/s/p 1:51:34 } +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1517/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 5.321952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.65952 samples/s/p 1:51:30 } +2024-07-30 04:17:36,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1519/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 5.318504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:36,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.66282 samples/s/p 1:51:23 } +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1521/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 5.3150557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:39,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66085 samples/s/p 1:51:23 } +2024-07-30 04:17:42,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1523/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 5.311608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:42,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66183 samples/s/p 1:51:19 } +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1525/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 5.3081594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:45,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66031 samples/s/p 1:51:18 } +2024-07-30 04:17:48,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1527/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 5.3047115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:48,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66059 samples/s/p 1:51:14 } +2024-07-30 04:17:51,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1529/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 5.301262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:51,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.66039 samples/s/p 1:51:12 } +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1531/ 3125], loss: 0.126, per_step_time: 1412ms, lr: 5.2978135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:53,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66297 samples/s/p 1:51:06 } +2024-07-30 04:17:56,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1533/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 5.2943647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:56,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65865 samples/s/p 1:51:08 } +2024-07-30 04:17:59,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1535/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 5.290916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:17:59,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.66008 samples/s/p 1:51:04 } +2024-07-30 04:18:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1537/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 5.287467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65678 samples/s/p 1:51:05 } +2024-07-30 04:18:05,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1539/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 5.2840173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:05,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.65735 samples/s/p 1:51:01 } +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1541/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.280567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:08,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66253 samples/s/p 1:50:52 } +2024-07-30 04:18:10,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1543/ 3125], loss: 0.397, per_step_time: 1414ms, lr: 5.277118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.65502 samples/s/p 1:50:58 } +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1545/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 5.2736686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66062 samples/s/p 1:50:49 } +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1547/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 5.270219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:16,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.66189 samples/s/p 1:50:45 } +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1549/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 5.2667688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:19,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65864 samples/s/p 1:50:46 } +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1551/ 3125], loss: 0.416, per_step_time: 1414ms, lr: 5.263318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:22,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65506 samples/s/p 1:50:47 } +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1553/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 5.259868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:25,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65776 samples/s/p 1:50:41 } +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1555/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.256418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:27,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.65478 samples/s/p 1:50:42 } +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1557/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.252967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:30,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.66153 samples/s/p 1:50:31 } +2024-07-30 04:18:33,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1559/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 5.2495175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:33,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65874 samples/s/p 1:50:31 } +2024-07-30 04:18:36,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1561/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.2460664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:36,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.65794 samples/s/p 1:50:29 } +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1563/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 5.2426153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:39,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65443 samples/s/p 1:50:31 } +2024-07-30 04:18:42,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1565/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 5.2391642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:42,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.65800 samples/s/p 1:50:24 } +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1567/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.235713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.66069 samples/s/p 1:50:18 } +2024-07-30 04:18:47,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1569/ 3125], loss: 0.161, per_step_time: 1415ms, lr: 5.232262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:47,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65296 samples/s/p 1:50:24 } +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1571/ 3125], loss: 0.227, per_step_time: 1412ms, lr: 5.2288115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:50,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66307 samples/s/p 1:50:09 } +2024-07-30 04:18:53,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1573/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 5.225359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:53,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.65980 samples/s/p 1:50:10 } +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1575/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 5.2219075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.66079 samples/s/p 1:50:06 } +2024-07-30 04:18:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1577/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 5.2184564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:18:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65863 samples/s/p 1:50:06 } +2024-07-30 04:19:01,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1579/ 3125], loss: 0.439, per_step_time: 1414ms, lr: 5.2150044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:01,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65578 samples/s/p 1:50:07 } +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1581/ 3125], loss: 0.413, per_step_time: 1412ms, lr: 5.2115533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:04,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66216 samples/s/p 1:49:56 } +2024-07-30 04:19:07,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1583/ 3125], loss: 0.246, per_step_time: 1412ms, lr: 5.2081014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:07,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.66253 samples/s/p 1:49:53 } +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1585/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 5.204649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.65992 samples/s/p 1:49:53 } +2024-07-30 04:19:13,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1587/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.2011965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:13,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66100 samples/s/p 1:49:49 } +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1589/ 3125], loss: 0.198, per_step_time: 1416ms, lr: 5.197744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:16,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.64735 samples/s/p 1:50:02 } +2024-07-30 04:19:18,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1591/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.1942925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:18,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66012 samples/s/p 1:49:45 } +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1593/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 5.19084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:21,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66031 samples/s/p 1:49:41 } +2024-07-30 04:19:24,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1595/ 3125], loss: 0.381, per_step_time: 1412ms, lr: 5.187388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:24,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.66299 samples/s/p 1:49:36 } +2024-07-30 04:19:27,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1597/ 3125], loss: 0.323, per_step_time: 1414ms, lr: 5.1839343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65535 samples/s/p 1:49:42 } +2024-07-30 04:19:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1599/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 5.1804823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66159 samples/s/p 1:49:32 } +2024-07-30 04:19:33,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1601/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 5.17703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:33,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.66011 samples/s/p 1:49:30 } +2024-07-30 04:19:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1603/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 5.1735765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:35,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.65528 samples/s/p 1:49:33 } +2024-07-30 04:19:38,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1605/ 3125], loss: 0.489, per_step_time: 1412ms, lr: 5.170124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:38,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.66370 samples/s/p 1:49:21 } +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1607/ 3125], loss: 0.258, per_step_time: 1414ms, lr: 5.166671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:41,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65688 samples/s/p 1:49:26 } +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1609/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 5.163218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65578 samples/s/p 1:49:24 } +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1611/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 5.159764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:47,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65690 samples/s/p 1:49:20 } +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1613/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 5.156311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.65577 samples/s/p 1:49:18 } +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1615/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 5.152858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:52,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65803 samples/s/p 1:49:13 } +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1617/ 3125], loss: 0.555, per_step_time: 1413ms, lr: 5.149405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:55,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66134 samples/s/p 1:49:06 } +2024-07-30 04:19:58,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1619/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.1459515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:19:58,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66098 samples/s/p 1:49:04 } +2024-07-30 04:20:01,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1621/ 3125], loss: 0.141, per_step_time: 1412ms, lr: 5.1424972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:01,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.66216 samples/s/p 1:49:00 } +2024-07-30 04:20:04,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1623/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 5.1390443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:04,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.65966 samples/s/p 1:49:00 } +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1625/ 3125], loss: 0.078, per_step_time: 1417ms, lr: 5.1355905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:07,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.64371 samples/s/p 1:49:15 } +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1627/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 5.1321367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65595 samples/s/p 1:48:58 } +2024-07-30 04:20:12,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1629/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 5.1286834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.65822 samples/s/p 1:48:53 } +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1631/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 5.125229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:15,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.66060 samples/s/p 1:48:47 } +2024-07-30 04:20:18,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1633/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 5.1217744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:18,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66092 samples/s/p 1:48:44 } +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1635/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 5.118321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:21,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65827 samples/s/p 1:48:44 } +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1637/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 5.1148677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:24,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65910 samples/s/p 1:48:41 } +2024-07-30 04:20:26,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1639/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 5.111413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.66072 samples/s/p 1:48:36 } +2024-07-30 04:20:29,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1641/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 5.107959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.65924 samples/s/p 1:48:35 } +2024-07-30 04:20:32,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1643/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 5.104505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:32,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66028 samples/s/p 1:48:31 } +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1645/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 5.1010506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:35,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66177 samples/s/p 1:48:26 } +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1647/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.097596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:38,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66094 samples/s/p 1:48:24 } +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1649/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 5.0941417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:41,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66176 samples/s/p 1:48:21 } +2024-07-30 04:20:43,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1651/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 5.090688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:43,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.66082 samples/s/p 1:48:19 } +2024-07-30 04:20:46,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1653/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.087233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:46,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66124 samples/s/p 1:48:16 } +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1655/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 5.0837784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65887 samples/s/p 1:48:15 } +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1657/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 5.080324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:52,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.65967 samples/s/p 1:48:12 } +2024-07-30 04:20:55,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1659/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 5.0768704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:55,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.66003 samples/s/p 1:48:09 } +2024-07-30 04:20:58,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1661/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 5.0734147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:20:58,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65959 samples/s/p 1:48:06 } +2024-07-30 04:21:00,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1663/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 5.069961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:00,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.66055 samples/s/p 1:48:02 } +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1665/ 3125], loss: 0.072, per_step_time: 1413ms, lr: 5.0665058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:03,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65858 samples/s/p 1:48:02 } +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1667/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 5.0630515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:06,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65948 samples/s/p 1:47:58 } +2024-07-30 04:21:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1669/ 3125], loss: 0.248, per_step_time: 1414ms, lr: 5.0595963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:09,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.65729 samples/s/p 1:47:58 } +2024-07-30 04:21:12,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1671/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 5.056142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:12,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65753 samples/s/p 1:47:54 } +2024-07-30 04:21:15,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1673/ 3125], loss: 0.259, per_step_time: 1415ms, lr: 5.0526874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:15,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65148 samples/s/p 1:47:59 } +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1675/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 5.049232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:17,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65856 samples/s/p 1:47:48 } +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1677/ 3125], loss: 0.251, per_step_time: 1415ms, lr: 5.0457775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:20,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.65315 samples/s/p 1:47:51 } +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1679/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 5.0423228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:23,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.66131 samples/s/p 1:47:39 } +2024-07-30 04:21:26,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1681/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 5.038868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:26,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66075 samples/s/p 1:47:37 } +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1683/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 5.035413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:29,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.66143 samples/s/p 1:47:33 } +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1685/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 5.031958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:32,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65954 samples/s/p 1:47:32 } +2024-07-30 04:21:34,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1687/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 5.028503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:34,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65946 samples/s/p 1:47:30 } +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1689/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.0250483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:37,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.65773 samples/s/p 1:47:29 } +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1691/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 5.0215936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:40,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66256 samples/s/p 1:47:20 } +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1693/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 5.018139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:43,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.66047 samples/s/p 1:47:20 } +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1695/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 5.014684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:46,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65553 samples/s/p 1:47:23 } +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1697/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 5.011229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:49,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.65912 samples/s/p 1:47:16 } +2024-07-30 04:21:51,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1699/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 5.0077733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:51,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66026 samples/s/p 1:47:12 } +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1701/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 5.0043186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:54,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66090 samples/s/p 1:47:08 } +2024-07-30 04:21:57,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1703/ 3125], loss: 0.478, per_step_time: 1413ms, lr: 5.0008643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:21:57,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66028 samples/s/p 1:47:06 } +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1705/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.997409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:00,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.65876 samples/s/p 1:47:05 } +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1707/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.993954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:03,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.66132 samples/s/p 1:46:59 } +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1709/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.9904984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:06,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65782 samples/s/p 1:47:00 } +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1711/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 4.987043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:08,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66310 samples/s/p 1:46:52 } +2024-07-30 04:22:11,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1713/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 4.9835885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:11,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66055 samples/s/p 1:46:52 } +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1715/ 3125], loss: 0.193, per_step_time: 1412ms, lr: 4.980134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:14,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.66326 samples/s/p 1:46:46 } +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1717/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 4.9766795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:17,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.65687 samples/s/p 1:46:50 } +2024-07-30 04:22:20,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1719/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 4.9732243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:20,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.66186 samples/s/p 1:46:42 } +2024-07-30 04:22:23,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1721/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 4.9697696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:23,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65978 samples/s/p 1:46:41 } +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1723/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 4.9663136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:25,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65453 samples/s/p 1:46:44 } +2024-07-30 04:22:28,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1725/ 3125], loss: 0.293, per_step_time: 1413ms, lr: 4.962859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:28,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.65813 samples/s/p 1:46:37 } +2024-07-30 04:22:31,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1727/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 4.9594046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:31,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66144 samples/s/p 1:46:31 } +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1729/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 4.95595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:34,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.66131 samples/s/p 1:46:28 } +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1731/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.952495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:37,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65769 samples/s/p 1:46:29 } +2024-07-30 04:22:40,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1733/ 3125], loss: 0.057, per_step_time: 1413ms, lr: 4.9490404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:40,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65986 samples/s/p 1:46:24 } +2024-07-30 04:22:42,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1735/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 4.9455857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:42,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.65622 samples/s/p 1:46:25 } +2024-07-30 04:22:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1737/ 3125], loss: 0.193, per_step_time: 1415ms, lr: 4.9421305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.65356 samples/s/p 1:46:26 } +2024-07-30 04:22:48,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1739/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.938676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:48,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66011 samples/s/p 1:46:15 } +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1741/ 3125], loss: 0.430, per_step_time: 1412ms, lr: 4.935221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:51,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66218 samples/s/p 1:46:10 } +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1743/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 4.9317664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:54,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66203 samples/s/p 1:46:08 } +2024-07-30 04:22:57,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1745/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 4.928312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:57,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.66211 samples/s/p 1:46:05 } +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1747/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 4.924858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:22:59,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.66102 samples/s/p 1:46:03 } +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1749/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.9214036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.66085 samples/s/p 1:46:00 } +2024-07-30 04:23:05,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1751/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 4.917948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.66177 samples/s/p 1:45:57 } +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1753/ 3125], loss: 0.163, per_step_time: 1414ms, lr: 4.9144937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.65717 samples/s/p 1:45:59 } +2024-07-30 04:23:11,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1755/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.911039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:11,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65859 samples/s/p 1:45:54 } +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1757/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 4.9075848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65423 samples/s/p 1:45:57 } +2024-07-30 04:23:16,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1759/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.904131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:16,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66318 samples/s/p 1:45:44 } +2024-07-30 04:23:19,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1761/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 4.9006767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:19,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.65778 samples/s/p 1:45:47 } +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1763/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 4.8972224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:22,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.66200 samples/s/p 1:45:39 } +2024-07-30 04:23:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1765/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.8937677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.66228 samples/s/p 1:45:36 } +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1767/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 4.8903134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:28,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65939 samples/s/p 1:45:37 } +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1769/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.8868596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:31,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65688 samples/s/p 1:45:37 } +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1771/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 4.883406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:33,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65959 samples/s/p 1:45:31 } +2024-07-30 04:23:36,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1773/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.879952e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:36,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.65878 samples/s/p 1:45:29 } +2024-07-30 04:23:39,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1775/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 4.8764978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:39,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66096 samples/s/p 1:45:24 } +2024-07-30 04:23:42,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1777/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.873044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:42,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66036 samples/s/p 1:45:21 } +2024-07-30 04:23:45,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1779/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 4.8695906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:45,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.66146 samples/s/p 1:45:17 } +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1781/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 4.866136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:48,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.65868 samples/s/p 1:45:18 } +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1783/ 3125], loss: 0.181, per_step_time: 1412ms, lr: 4.8626825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66301 samples/s/p 1:45:10 } +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1785/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 4.859229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:53,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65970 samples/s/p 1:45:11 } +2024-07-30 04:23:56,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1787/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 4.855775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.66013 samples/s/p 1:45:07 } +2024-07-30 04:23:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1789/ 3125], loss: 0.286, per_step_time: 1414ms, lr: 4.852322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:23:59,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65618 samples/s/p 1:45:09 } +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1791/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.8488687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:02,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.65838 samples/s/p 1:45:04 } +2024-07-30 04:24:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1793/ 3125], loss: 0.276, per_step_time: 1414ms, lr: 4.845416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:05,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65633 samples/s/p 1:45:03 } +2024-07-30 04:24:07,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1795/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 4.8419615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:07,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65787 samples/s/p 1:44:59 } +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1797/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.8385086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:10,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65854 samples/s/p 1:44:55 } +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1799/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 4.8350553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:13,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.66226 samples/s/p 1:44:48 } +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1801/ 3125], loss: 0.288, per_step_time: 1415ms, lr: 4.8316024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:16,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.65333 samples/s/p 1:44:55 } +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1803/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.82815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:19,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66096 samples/s/p 1:44:44 } +2024-07-30 04:24:22,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1805/ 3125], loss: 0.420, per_step_time: 1412ms, lr: 4.824697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:22,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66251 samples/s/p 1:44:39 } +2024-07-30 04:24:24,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1807/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 4.821244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:25,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66191 samples/s/p 1:44:37 } +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1809/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 4.8177913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.66117 samples/s/p 1:44:35 } +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1811/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 4.814338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:30,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66165 samples/s/p 1:44:32 } +2024-07-30 04:24:33,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1813/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.810886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65884 samples/s/p 1:44:32 } +2024-07-30 04:24:36,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1815/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.8074335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:36,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66084 samples/s/p 1:44:27 } +2024-07-30 04:24:39,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1817/ 3125], loss: 0.556, per_step_time: 1413ms, lr: 4.8039815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.65952 samples/s/p 1:44:26 } +2024-07-30 04:24:42,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1819/ 3125], loss: 0.369, per_step_time: 1412ms, lr: 4.800529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.66224 samples/s/p 1:44:20 } +2024-07-30 04:24:44,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1821/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 4.797077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66139 samples/s/p 1:44:18 } +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1823/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.793624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:47,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65808 samples/s/p 1:44:19 } +2024-07-30 04:24:50,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1825/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.7901726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:50,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.66123 samples/s/p 1:44:13 } +2024-07-30 04:24:53,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1827/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 4.7867206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:53,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65990 samples/s/p 1:44:11 } +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1829/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 4.7832696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:56,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.65850 samples/s/p 1:44:10 } +2024-07-30 04:24:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1831/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 4.779817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:24:59,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66094 samples/s/p 1:44:04 } +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1833/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.776366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:01,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66069 samples/s/p 1:44:02 } +2024-07-30 04:25:04,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1835/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.772915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:04,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66067 samples/s/p 1:43:59 } +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1837/ 3125], loss: 0.406, per_step_time: 1416ms, lr: 4.769464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:07,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.64605 samples/s/p 1:44:12 } +2024-07-30 04:25:10,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1839/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.766012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.66135 samples/s/p 1:43:53 } +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1841/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 4.762561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65805 samples/s/p 1:43:53 } +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1843/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 4.7591093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:16,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65411 samples/s/p 1:43:55 } +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1845/ 3125], loss: 0.663, per_step_time: 1416ms, lr: 4.755659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:18,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.64718 samples/s/p 1:44:00 } +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1847/ 3125], loss: 0.470, per_step_time: 1413ms, lr: 4.7522085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:21,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.65984 samples/s/p 1:43:43 } +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1849/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 4.748758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:24,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65696 samples/s/p 1:43:43 } +2024-07-30 04:25:27,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1851/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7453073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:27,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66104 samples/s/p 1:43:36 } +2024-07-30 04:25:30,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1853/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 4.741856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.65889 samples/s/p 1:43:36 } +2024-07-30 04:25:33,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1855/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 4.738406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66145 samples/s/p 1:43:30 } +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1857/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.734956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:35,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.66114 samples/s/p 1:43:27 } +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1859/ 3125], loss: 0.089, per_step_time: 1414ms, lr: 4.731506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:38,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65393 samples/s/p 1:43:33 } +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1861/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 4.728057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:41,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65689 samples/s/p 1:43:26 } +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1863/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 4.7246062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:44,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.66013 samples/s/p 1:43:20 } +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1865/ 3125], loss: 0.362, per_step_time: 1414ms, lr: 4.721157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:47,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65711 samples/s/p 1:43:21 } +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1867/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 4.717707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:50,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.65997 samples/s/p 1:43:15 } +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1869/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 4.7142576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:52,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66126 samples/s/p 1:43:10 } +2024-07-30 04:25:55,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1871/ 3125], loss: 0.289, per_step_time: 1415ms, lr: 4.7108088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:55,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.65154 samples/s/p 1:43:18 } +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1873/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 4.70736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:25:58,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66100 samples/s/p 1:43:05 } +2024-07-30 04:26:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1875/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 4.7039107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:01,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.66047 samples/s/p 1:43:03 } +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1877/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.700462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66000 samples/s/p 1:43:00 } +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1879/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.6970135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:07,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66010 samples/s/p 1:42:57 } +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1881/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.6935643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65893 samples/s/p 1:42:56 } +2024-07-30 04:26:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1883/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 4.690116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:12,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.65894 samples/s/p 1:42:53 } +2024-07-30 04:26:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1885/ 3125], loss: 0.450, per_step_time: 1412ms, lr: 4.686668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:15,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.66322 samples/s/p 1:42:46 } +2024-07-30 04:26:18,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1887/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 4.6832197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:18,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65974 samples/s/p 1:42:47 } +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1889/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 4.679772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:21,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65832 samples/s/p 1:42:45 } +2024-07-30 04:26:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1891/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.6763244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65884 samples/s/p 1:42:42 } +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1893/ 3125], loss: 0.161, per_step_time: 1414ms, lr: 4.672877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:26,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.65650 samples/s/p 1:42:42 } +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1895/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 4.6694286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:29,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.66218 samples/s/p 1:42:33 } +2024-07-30 04:26:32,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1897/ 3125], loss: 0.409, per_step_time: 1413ms, lr: 4.6659816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:32,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.65983 samples/s/p 1:42:32 } +2024-07-30 04:26:35,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1899/ 3125], loss: 0.394, per_step_time: 1412ms, lr: 4.662534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:35,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66181 samples/s/p 1:42:27 } +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1901/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.659087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66174 samples/s/p 1:42:25 } +2024-07-30 04:26:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1903/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.655641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.66060 samples/s/p 1:42:23 } +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1905/ 3125], loss: 0.525, per_step_time: 1413ms, lr: 4.652194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:43,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66150 samples/s/p 1:42:19 } +2024-07-30 04:26:46,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1907/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 4.648748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66071 samples/s/p 1:42:17 } +2024-07-30 04:26:49,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1909/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 4.6453015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:49,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.65943 samples/s/p 1:42:16 } +2024-07-30 04:26:52,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1911/ 3125], loss: 0.398, per_step_time: 1413ms, lr: 4.6418545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:52,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66162 samples/s/p 1:42:11 } +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1913/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.6384084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.66032 samples/s/p 1:42:09 } +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1915/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.6349633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:26:58,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66144 samples/s/p 1:42:05 } +2024-07-30 04:27:00,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1917/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.6315176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:00,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.66159 samples/s/p 1:42:02 } +2024-07-30 04:27:03,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1919/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.6280725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65997 samples/s/p 1:42:01 } +2024-07-30 04:27:06,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1921/ 3125], loss: 0.118, per_step_time: 1414ms, lr: 4.624627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65722 samples/s/p 1:42:01 } +2024-07-30 04:27:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1923/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 4.621182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:09,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.65432 samples/s/p 1:42:02 } +2024-07-30 04:27:12,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1925/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 4.617736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:12,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65791 samples/s/p 1:41:55 } +2024-07-30 04:27:15,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1927/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.614292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:15,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65768 samples/s/p 1:41:52 } +2024-07-30 04:27:17,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1929/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.6108476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:17,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.65908 samples/s/p 1:41:48 } +2024-07-30 04:27:20,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1931/ 3125], loss: 0.541, per_step_time: 1413ms, lr: 4.6074033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.66149 samples/s/p 1:41:42 } +2024-07-30 04:27:23,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1933/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.603959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:23,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65932 samples/s/p 1:41:42 } +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1935/ 3125], loss: 0.469, per_step_time: 1413ms, lr: 4.6005152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:26,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65889 samples/s/p 1:41:40 } +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1937/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.5970714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:29,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.65981 samples/s/p 1:41:36 } +2024-07-30 04:27:32,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1939/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.593627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:32,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.66024 samples/s/p 1:41:33 } +2024-07-30 04:27:34,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1941/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.590184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:34,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.65952 samples/s/p 1:41:30 } +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1943/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 4.586741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.66111 samples/s/p 1:41:26 } +2024-07-30 04:27:40,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1945/ 3125], loss: 0.203, per_step_time: 1414ms, lr: 4.5832976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:40,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65451 samples/s/p 1:41:30 } +2024-07-30 04:27:43,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1947/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 4.579855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:43,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.66019 samples/s/p 1:41:21 } +2024-07-30 04:27:46,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1949/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.5764127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:46,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65868 samples/s/p 1:41:20 } +2024-07-30 04:27:49,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1951/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 4.5729703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:49,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.65622 samples/s/p 1:41:20 } +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1953/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.5695274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:51,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65880 samples/s/p 1:41:14 } +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1955/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 4.5660854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:54,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.65979 samples/s/p 1:41:10 } +2024-07-30 04:27:57,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1957/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.5626434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:27:57,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66150 samples/s/p 1:41:06 } +2024-07-30 04:28:00,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1959/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 4.559202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:00,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.66009 samples/s/p 1:41:04 } +2024-07-30 04:28:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1961/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 4.555761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:03,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66089 samples/s/p 1:41:01 } +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1963/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 4.55232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:06,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66087 samples/s/p 1:40:58 } +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1965/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 4.5488787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:08,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66154 samples/s/p 1:40:54 } +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1967/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 4.5454376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.66120 samples/s/p 1:40:52 } +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1969/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.5419965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:14,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.65960 samples/s/p 1:40:51 } +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1971/ 3125], loss: 0.551, per_step_time: 1413ms, lr: 4.538557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:17,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66006 samples/s/p 1:40:47 } +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1973/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 4.535117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:20,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66086 samples/s/p 1:40:44 } +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1975/ 3125], loss: 0.281, per_step_time: 1414ms, lr: 4.5316774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65752 samples/s/p 1:40:45 } +2024-07-30 04:28:25,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1977/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 4.5282372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.66103 samples/s/p 1:40:38 } +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1979/ 3125], loss: 0.150, per_step_time: 1414ms, lr: 4.5247984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.65501 samples/s/p 1:40:42 } +2024-07-30 04:28:31,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1981/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 4.521359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:31,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66223 samples/s/p 1:40:31 } +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1983/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 4.5179195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:34,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66129 samples/s/p 1:40:29 } +2024-07-30 04:28:37,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1985/ 3125], loss: 0.598, per_step_time: 1413ms, lr: 4.5144807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:37,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.65779 samples/s/p 1:40:30 } +2024-07-30 04:28:40,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1987/ 3125], loss: 0.309, per_step_time: 1412ms, lr: 4.511043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:40,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66291 samples/s/p 1:40:22 } +2024-07-30 04:28:42,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1989/ 3125], loss: 0.072, per_step_time: 1412ms, lr: 4.507604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:42,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.66266 samples/s/p 1:40:19 } +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1991/ 3125], loss: 0.251, per_step_time: 1412ms, lr: 4.504166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:45,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66325 samples/s/p 1:40:16 } +2024-07-30 04:28:48,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1993/ 3125], loss: 0.312, per_step_time: 1414ms, lr: 4.5007287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:48,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65681 samples/s/p 1:40:20 } +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1995/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.4972912e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:51,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.66052 samples/s/p 1:40:13 } +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1997/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 4.493853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:54,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.65750 samples/s/p 1:40:13 } +2024-07-30 04:28:57,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 1999/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 4.4904164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:57,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66007 samples/s/p 1:40:08 } +2024-07-30 04:28:59,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2001/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 4.486979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:28:59,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.65754 samples/s/p 1:40:08 } +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2003/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 4.483543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:02,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66074 samples/s/p 1:40:02 } +2024-07-30 04:29:05,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2005/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 4.480107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:05,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66049 samples/s/p 1:39:59 } +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2007/ 3125], loss: 0.148, per_step_time: 1413ms, lr: 4.4766707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:08,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.66053 samples/s/p 1:39:56 } +2024-07-30 04:29:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2009/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.4732346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:11,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66017 samples/s/p 1:39:54 } +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2011/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 4.4697986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:14,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65903 samples/s/p 1:39:52 } +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2013/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 4.466363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:16,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65664 samples/s/p 1:39:52 } +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2015/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 4.4629282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:19,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.66171 samples/s/p 1:39:44 } +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2017/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.4594935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:22,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.65945 samples/s/p 1:39:43 } +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2019/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 4.4560597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:25,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65813 samples/s/p 1:39:42 } +2024-07-30 04:29:28,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2021/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 4.4526246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:28,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65469 samples/s/p 1:39:42 } +2024-07-30 04:29:31,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2023/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.449191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:31,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65739 samples/s/p 1:39:37 } +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2025/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 4.445756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:33,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.65463 samples/s/p 1:39:37 } +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2027/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 4.442323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:36,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.65988 samples/s/p 1:39:29 } +2024-07-30 04:29:39,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2029/ 3125], loss: 0.114, per_step_time: 1427ms, lr: 4.4388903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:39,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.60280 samples/s/p 1:40:26 } +2024-07-30 04:29:42,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2031/ 3125], loss: 0.126, per_step_time: 1412ms, lr: 4.435457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:42,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66392 samples/s/p 1:39:19 } +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2033/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 4.432024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:45,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66258 samples/s/p 1:39:17 } +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2035/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.428592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:48,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.66161 samples/s/p 1:39:15 } +2024-07-30 04:29:50,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2037/ 3125], loss: 0.384, per_step_time: 1413ms, lr: 4.42516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:50,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66035 samples/s/p 1:39:14 } +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2039/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 4.4217286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:53,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66068 samples/s/p 1:39:11 } +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2041/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.4182957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:56,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66135 samples/s/p 1:39:07 } +2024-07-30 04:29:59,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2043/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 4.414865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:29:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.65985 samples/s/p 1:39:06 } +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2045/ 3125], loss: 0.360, per_step_time: 1412ms, lr: 4.4114336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.66204 samples/s/p 1:39:01 } +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2047/ 3125], loss: 0.136, per_step_time: 1442ms, lr: 4.408003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:05,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.54574 samples/s/p 1:41:03 } +2024-07-30 04:30:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2049/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 4.404573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66040 samples/s/p 1:38:57 } +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2051/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.4011426e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66058 samples/s/p 1:38:54 } +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2053/ 3125], loss: 0.081, per_step_time: 1413ms, lr: 4.3977125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:13,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.66140 samples/s/p 1:38:50 } +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2055/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 4.3942828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:16,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65987 samples/s/p 1:38:49 } +2024-07-30 04:30:19,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2057/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 4.390853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:19,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65910 samples/s/p 1:38:47 } +2024-07-30 04:30:22,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2059/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 4.387424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.66145 samples/s/p 1:38:42 } +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2061/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 4.3839955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:25,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65910 samples/s/p 1:38:41 } +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2063/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 4.380567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:27,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.65747 samples/s/p 1:38:40 } +2024-07-30 04:30:30,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2065/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 4.377139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:30,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65894 samples/s/p 1:38:36 } +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2067/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 4.3737114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:33,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.65976 samples/s/p 1:38:32 } +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2069/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 4.3702826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66206 samples/s/p 1:38:27 } +2024-07-30 04:30:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2071/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 4.3668556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66158 samples/s/p 1:38:25 } +2024-07-30 04:30:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2073/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 4.3634286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.66037 samples/s/p 1:38:23 } +2024-07-30 04:30:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2075/ 3125], loss: 0.453, per_step_time: 1413ms, lr: 4.3600025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:44,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65919 samples/s/p 1:38:21 } +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2077/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.3565756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:47,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65310 samples/s/p 1:38:25 } +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2079/ 3125], loss: 0.239, per_step_time: 1414ms, lr: 4.35315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:50,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65468 samples/s/p 1:38:20 } +2024-07-30 04:30:53,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2081/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 4.3497243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:53,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.65682 samples/s/p 1:38:15 } +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2083/ 3125], loss: 0.231, per_step_time: 1416ms, lr: 4.346298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:56,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.64691 samples/s/p 1:38:23 } +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2085/ 3125], loss: 0.124, per_step_time: 1413ms, lr: 4.342873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:30:59,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66004 samples/s/p 1:38:06 } +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2087/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 4.339449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:01,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66137 samples/s/p 1:38:02 } +2024-07-30 04:31:04,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2089/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 4.3360237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:04,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66230 samples/s/p 1:37:58 } +2024-07-30 04:31:07,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2091/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 4.3326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:07,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.66165 samples/s/p 1:37:56 } +2024-07-30 04:31:10,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2093/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 4.329176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:10,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66115 samples/s/p 1:37:54 } +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2095/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 4.3257533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66297 samples/s/p 1:37:49 } +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2097/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 4.3223286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66217 samples/s/p 1:37:47 } +2024-07-30 04:31:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2099/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.318906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:18,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66034 samples/s/p 1:37:46 } +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2101/ 3125], loss: 0.409, per_step_time: 1412ms, lr: 4.3154832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:21,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.66237 samples/s/p 1:37:41 } +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2103/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 4.3120613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66060 samples/s/p 1:37:40 } +2024-07-30 04:31:27,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2105/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.3086397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:27,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66031 samples/s/p 1:37:38 } +2024-07-30 04:31:30,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2107/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 4.305218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:30,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.66060 samples/s/p 1:37:35 } +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2109/ 3125], loss: 0.384, per_step_time: 1414ms, lr: 4.3017967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:33,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.65750 samples/s/p 1:37:35 } +2024-07-30 04:31:35,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2111/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 4.298376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:35,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66057 samples/s/p 1:37:29 } +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2113/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 4.2949546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:38,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65911 samples/s/p 1:37:28 } +2024-07-30 04:31:41,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2115/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 4.2915344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.66067 samples/s/p 1:37:23 } +2024-07-30 04:31:44,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2117/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 4.2881147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:44,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65905 samples/s/p 1:37:22 } +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2119/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 4.2846955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:47,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.65876 samples/s/p 1:37:20 } +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2121/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 4.281276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:50,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.66148 samples/s/p 1:37:14 } +2024-07-30 04:31:52,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2123/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 4.2778574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:52,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.65472 samples/s/p 1:37:18 } +2024-07-30 04:31:55,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2125/ 3125], loss: 0.325, per_step_time: 1412ms, lr: 4.274439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:55,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.66242 samples/s/p 1:37:07 } +2024-07-30 04:31:58,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2127/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.27102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:31:58,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.66090 samples/s/p 1:37:06 } +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2129/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.2676024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:01,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.65850 samples/s/p 1:37:06 } +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2131/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 4.264185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:04,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65965 samples/s/p 1:37:02 } +2024-07-30 04:32:07,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2133/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 4.2607676e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:07,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66166 samples/s/p 1:36:57 } +2024-07-30 04:32:09,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2135/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 4.257351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:09,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.66068 samples/s/p 1:36:55 } +2024-07-30 04:32:12,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2137/ 3125], loss: 0.383, per_step_time: 1413ms, lr: 4.253935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:12,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65776 samples/s/p 1:36:55 } +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2139/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 4.250519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:15,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.65269 samples/s/p 1:36:58 } +2024-07-30 04:32:18,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2141/ 3125], loss: 0.498, per_step_time: 1413ms, lr: 4.2471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:18,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.66076 samples/s/p 1:36:46 } +2024-07-30 04:32:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2143/ 3125], loss: 0.146, per_step_time: 1414ms, lr: 4.2436873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65726 samples/s/p 1:36:47 } +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2145/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 4.240272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:24,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65827 samples/s/p 1:36:43 } +2024-07-30 04:32:26,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2147/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 4.2368574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:26,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.65616 samples/s/p 1:36:43 } +2024-07-30 04:32:29,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2149/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.2334436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:29,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.66113 samples/s/p 1:36:35 } +2024-07-30 04:32:32,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2151/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 4.23003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:32,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65558 samples/s/p 1:36:38 } +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2153/ 3125], loss: 0.188, per_step_time: 1414ms, lr: 4.226616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:35,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65730 samples/s/p 1:36:33 } +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2155/ 3125], loss: 0.256, per_step_time: 1418ms, lr: 4.2232023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.63909 samples/s/p 1:36:49 } +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2157/ 3125], loss: 0.396, per_step_time: 1414ms, lr: 4.2197894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:41,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.65481 samples/s/p 1:36:30 } +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2159/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 4.216377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:43,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66009 samples/s/p 1:36:22 } +2024-07-30 04:32:46,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2161/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 4.2129655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:46,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65483 samples/s/p 1:36:24 } +2024-07-30 04:32:49,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2163/ 3125], loss: 0.292, per_step_time: 1412ms, lr: 4.209554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66214 samples/s/p 1:36:14 } +2024-07-30 04:32:52,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2165/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 4.2061424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:52,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.66172 samples/s/p 1:36:12 } +2024-07-30 04:32:55,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2167/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 4.2027314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.65546 samples/s/p 1:36:15 } +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2169/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 4.19932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:32:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66065 samples/s/p 1:36:07 } +2024-07-30 04:33:00,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2171/ 3125], loss: 0.269, per_step_time: 1412ms, lr: 4.19591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:00,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66225 samples/s/p 1:36:03 } +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2173/ 3125], loss: 0.463, per_step_time: 1413ms, lr: 4.1925005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:03,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.66055 samples/s/p 1:36:01 } +2024-07-30 04:33:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2175/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 4.1890917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:06,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.65874 samples/s/p 1:36:00 } +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2177/ 3125], loss: 0.359, per_step_time: 1412ms, lr: 4.185682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66190 samples/s/p 1:35:54 } +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2179/ 3125], loss: 0.340, per_step_time: 1412ms, lr: 4.1822736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:12,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66202 samples/s/p 1:35:52 } +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2181/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 4.1788658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:15,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66136 samples/s/p 1:35:49 } +2024-07-30 04:33:17,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2183/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 4.1754583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66003 samples/s/p 1:35:48 } +2024-07-30 04:33:20,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2185/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 4.1720496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:20,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.66192 samples/s/p 1:35:43 } +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2187/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.168643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:23,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65843 samples/s/p 1:35:44 } +2024-07-30 04:33:26,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2189/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 4.165236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:26,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65908 samples/s/p 1:35:40 } +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2191/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 4.16183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:29,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.66053 samples/s/p 1:35:36 } +2024-07-30 04:33:32,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2193/ 3125], loss: 0.481, per_step_time: 1413ms, lr: 4.1584244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:32,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.66001 samples/s/p 1:35:34 } +2024-07-30 04:33:34,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2195/ 3125], loss: 0.492, per_step_time: 1415ms, lr: 4.1550193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:34,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.65268 samples/s/p 1:35:38 } +2024-07-30 04:33:37,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2197/ 3125], loss: 0.273, per_step_time: 1414ms, lr: 4.1516146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:37,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65720 samples/s/p 1:35:31 } +2024-07-30 04:33:40,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2199/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 4.148209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:40,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65785 samples/s/p 1:35:27 } +2024-07-30 04:33:43,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2201/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 4.1448043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:43,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.65911 samples/s/p 1:35:23 } +2024-07-30 04:33:46,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2203/ 3125], loss: 0.338, per_step_time: 1412ms, lr: 4.141401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:46,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.66229 samples/s/p 1:35:17 } +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2205/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 4.1379976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:49,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.65982 samples/s/p 1:35:17 } +2024-07-30 04:33:51,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2207/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 4.1345947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:51,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66134 samples/s/p 1:35:13 } +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2209/ 3125], loss: 0.401, per_step_time: 1412ms, lr: 4.131192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:54,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66254 samples/s/p 1:35:09 } +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2211/ 3125], loss: 0.233, per_step_time: 1412ms, lr: 4.12779e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:33:57,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66231 samples/s/p 1:35:06 } +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2213/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 4.1243875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.66127 samples/s/p 1:35:04 } +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2215/ 3125], loss: 0.232, per_step_time: 1412ms, lr: 4.1209864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:03,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66283 samples/s/p 1:35:00 } +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2217/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 4.117586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:06,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66019 samples/s/p 1:35:00 } +2024-07-30 04:34:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2219/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 4.1141857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:08,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66070 samples/s/p 1:34:56 } +2024-07-30 04:34:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2221/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 4.110785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:11,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.66159 samples/s/p 1:34:53 } +2024-07-30 04:34:14,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2223/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 4.1073854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:14,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.65987 samples/s/p 1:34:52 } +2024-07-30 04:34:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2225/ 3125], loss: 0.285, per_step_time: 1414ms, lr: 4.1039866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65745 samples/s/p 1:34:51 } +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2227/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 4.1005865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:20,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65525 samples/s/p 1:34:50 } +2024-07-30 04:34:23,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2229/ 3125], loss: 0.402, per_step_time: 1413ms, lr: 4.0971886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:23,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65873 samples/s/p 1:34:44 } +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2231/ 3125], loss: 0.579, per_step_time: 1413ms, lr: 4.093791e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:25,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.65838 samples/s/p 1:34:42 } +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2233/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 4.0903933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:28,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65718 samples/s/p 1:34:40 } +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2235/ 3125], loss: 0.143, per_step_time: 1412ms, lr: 4.0869963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66172 samples/s/p 1:34:33 } +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2237/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 4.0836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:34,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65913 samples/s/p 1:34:32 } +2024-07-30 04:34:37,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2239/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 4.080204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:37,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.65446 samples/s/p 1:34:34 } +2024-07-30 04:34:40,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2241/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 4.0768073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:40,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.66216 samples/s/p 1:34:24 } +2024-07-30 04:34:42,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2243/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 4.073412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:42,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65832 samples/s/p 1:34:25 } +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2245/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 4.070017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.66009 samples/s/p 1:34:20 } +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2247/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 4.0666228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:48,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65600 samples/s/p 1:34:21 } +2024-07-30 04:34:51,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2249/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 4.063229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:51,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65849 samples/s/p 1:34:16 } +2024-07-30 04:34:54,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2251/ 3125], loss: 0.205, per_step_time: 1414ms, lr: 4.0598356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.65753 samples/s/p 1:34:14 } +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2253/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 4.056443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:57,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.66068 samples/s/p 1:34:08 } +2024-07-30 04:34:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2255/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 4.0530504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:34:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65805 samples/s/p 1:34:08 } +2024-07-30 04:35:02,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2257/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 4.049657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:02,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65835 samples/s/p 1:34:05 } +2024-07-30 04:35:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2259/ 3125], loss: 0.338, per_step_time: 1414ms, lr: 4.0462655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.65460 samples/s/p 1:34:06 } +2024-07-30 04:35:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2261/ 3125], loss: 0.310, per_step_time: 1412ms, lr: 4.0428745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66212 samples/s/p 1:33:56 } +2024-07-30 04:35:11,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2263/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.039484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:11,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65939 samples/s/p 1:33:55 } +2024-07-30 04:35:14,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2265/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 4.0360937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:14,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66283 samples/s/p 1:33:49 } +2024-07-30 04:35:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2267/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 4.0327036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:16,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.65830 samples/s/p 1:33:51 } +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2269/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 4.0293144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:19,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.66052 samples/s/p 1:33:46 } +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2271/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 4.025924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:22,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66308 samples/s/p 1:33:40 } +2024-07-30 04:35:25,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2273/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 4.0225364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:25,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66081 samples/s/p 1:33:40 } +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2275/ 3125], loss: 0.459, per_step_time: 1412ms, lr: 4.019148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:28,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66212 samples/s/p 1:33:36 } +2024-07-30 04:35:31,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2277/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 4.015761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:31,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66087 samples/s/p 1:33:34 } +2024-07-30 04:35:33,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2279/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 4.0123737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:33,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.66006 samples/s/p 1:33:32 } +2024-07-30 04:35:36,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2281/ 3125], loss: 0.136, per_step_time: 1412ms, lr: 4.008987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:36,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66294 samples/s/p 1:33:26 } +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2283/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 4.005601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:39,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65901 samples/s/p 1:33:28 } +2024-07-30 04:35:42,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2285/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 4.0022146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:42,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.65994 samples/s/p 1:33:24 } +2024-07-30 04:35:45,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2287/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.9988295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:45,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66080 samples/s/p 1:33:20 } +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2289/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.9954452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:48,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.66012 samples/s/p 1:33:18 } +2024-07-30 04:35:50,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2291/ 3125], loss: 0.377, per_step_time: 1412ms, lr: 3.9920606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:50,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.66244 samples/s/p 1:33:13 } +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2293/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 3.9886772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:53,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65697 samples/s/p 1:33:15 } +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2295/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.985294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:56,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65960 samples/s/p 1:33:10 } +2024-07-30 04:35:59,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2297/ 3125], loss: 0.109, per_step_time: 1414ms, lr: 3.9819115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:35:59,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.65655 samples/s/p 1:33:10 } +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2299/ 3125], loss: 0.496, per_step_time: 1413ms, lr: 3.978528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:02,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65809 samples/s/p 1:33:06 } +2024-07-30 04:36:05,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2301/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.9751467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:05,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65842 samples/s/p 1:33:03 } +2024-07-30 04:36:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2303/ 3125], loss: 0.450, per_step_time: 1414ms, lr: 3.9717647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65536 samples/s/p 1:33:03 } +2024-07-30 04:36:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2305/ 3125], loss: 0.127, per_step_time: 1414ms, lr: 3.9683846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:10,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.65763 samples/s/p 1:32:58 } +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2307/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.9650045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:13,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.66053 samples/s/p 1:32:52 } +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2309/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 3.9616248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:16,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66121 samples/s/p 1:32:49 } +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2311/ 3125], loss: 0.208, per_step_time: 1413ms, lr: 3.958245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:19,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.66031 samples/s/p 1:32:47 } +2024-07-30 04:36:22,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2313/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 3.9548663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:22,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.65989 samples/s/p 1:32:44 } +2024-07-30 04:36:24,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2315/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 3.951487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:24,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66285 samples/s/p 1:32:39 } +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2317/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.9481097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:27,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.66029 samples/s/p 1:32:38 } +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2319/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.9447323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:30,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66031 samples/s/p 1:32:35 } +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2321/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 3.9413558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66108 samples/s/p 1:32:32 } +2024-07-30 04:36:36,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2323/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.9379793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:36,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66010 samples/s/p 1:32:30 } +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2325/ 3125], loss: 0.107, per_step_time: 1412ms, lr: 3.9346037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:39,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.66224 samples/s/p 1:32:25 } +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2327/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.9312285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:41,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65968 samples/s/p 1:32:25 } +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2329/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.9278525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66136 samples/s/p 1:32:20 } +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2331/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 3.9244787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:47,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.66016 samples/s/p 1:32:19 } +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2333/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.921105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:50,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65908 samples/s/p 1:32:17 } +2024-07-30 04:36:53,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2335/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 3.9177316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:53,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.65713 samples/s/p 1:32:16 } +2024-07-30 04:36:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2337/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 3.914359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.66080 samples/s/p 1:32:09 } +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2339/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 3.910987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:36:58,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65879 samples/s/p 1:32:09 } +2024-07-30 04:37:01,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2341/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.9076153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65816 samples/s/p 1:32:06 } +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2343/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.9042434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:04,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65648 samples/s/p 1:32:05 } +2024-07-30 04:37:07,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2345/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 3.900873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:07,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.65966 samples/s/p 1:31:59 } +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2347/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 3.897502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:10,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65728 samples/s/p 1:31:59 } +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2349/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 3.894133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:13,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.66140 samples/s/p 1:31:52 } +2024-07-30 04:37:15,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2351/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 3.890764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:15,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65884 samples/s/p 1:31:52 } +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2353/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.887396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:18,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.65934 samples/s/p 1:31:48 } +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2355/ 3125], loss: 0.323, per_step_time: 1412ms, lr: 3.8840276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:21,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66303 samples/s/p 1:31:42 } +2024-07-30 04:37:24,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2357/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 3.8806597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:24,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65468 samples/s/p 1:31:47 } +2024-07-30 04:37:27,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2359/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 3.8772923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:27,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.66086 samples/s/p 1:31:38 } +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2361/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.873926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:30,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65699 samples/s/p 1:31:39 } +2024-07-30 04:37:32,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2363/ 3125], loss: 0.151, per_step_time: 1415ms, lr: 3.8705602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.65247 samples/s/p 1:31:41 } +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2365/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 3.867195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:35,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65910 samples/s/p 1:31:32 } +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2367/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.86383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:38,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65945 samples/s/p 1:31:28 } +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2369/ 3125], loss: 0.330, per_step_time: 1415ms, lr: 3.8604658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:41,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65238 samples/s/p 1:31:32 } +2024-07-30 04:37:44,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2371/ 3125], loss: 0.040, per_step_time: 1414ms, lr: 3.8571015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:44,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.65636 samples/s/p 1:31:26 } +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2373/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.8537382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:47,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.66169 samples/s/p 1:31:18 } +2024-07-30 04:37:49,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2375/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.850376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:49,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.65848 samples/s/p 1:31:18 } +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2377/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 3.8470143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:52,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66058 samples/s/p 1:31:13 } +2024-07-30 04:37:55,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2379/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.8436524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:55,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.66063 samples/s/p 1:31:10 } +2024-07-30 04:37:58,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2381/ 3125], loss: 0.364, per_step_time: 1416ms, lr: 3.8402914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:37:58,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.64732 samples/s/p 1:31:20 } +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2383/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.8369312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:01,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65855 samples/s/p 1:31:07 } +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2385/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 3.8335716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:04,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.65947 samples/s/p 1:31:03 } +2024-07-30 04:38:07,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2387/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 3.8302114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:07,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66004 samples/s/p 1:31:00 } +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2389/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.826853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:09,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66069 samples/s/p 1:30:56 } +2024-07-30 04:38:12,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2391/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.8234944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:12,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.66139 samples/s/p 1:30:53 } +2024-07-30 04:38:15,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2393/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 3.820137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:15,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65689 samples/s/p 1:30:54 } +2024-07-30 04:38:18,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2395/ 3125], loss: 0.094, per_step_time: 1413ms, lr: 3.81678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:18,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66075 samples/s/p 1:30:48 } +2024-07-30 04:38:21,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2397/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 3.8134237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:21,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.66050 samples/s/p 1:30:45 } +2024-07-30 04:38:24,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2399/ 3125], loss: 0.156, per_step_time: 1414ms, lr: 3.8100677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65374 samples/s/p 1:30:49 } +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2401/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.806712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:26,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.65841 samples/s/p 1:30:41 } +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2403/ 3125], loss: 0.595, per_step_time: 1413ms, lr: 3.8033568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:29,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65971 samples/s/p 1:30:37 } +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2405/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 3.8000028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65924 samples/s/p 1:30:35 } +2024-07-30 04:38:35,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2407/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 3.7966493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:35,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65646 samples/s/p 1:30:35 } +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2409/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7932964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:38,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.65706 samples/s/p 1:30:31 } +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2411/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.7899433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65892 samples/s/p 1:30:27 } +2024-07-30 04:38:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2413/ 3125], loss: 0.084, per_step_time: 1413ms, lr: 3.7865918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66054 samples/s/p 1:30:22 } +2024-07-30 04:38:46,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2415/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 3.7832397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:46,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66179 samples/s/p 1:30:18 } +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2417/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 3.7798889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:49,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.66019 samples/s/p 1:30:17 } +2024-07-30 04:38:52,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2419/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.7765392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:52,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.65894 samples/s/p 1:30:15 } +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2421/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 3.7731897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:55,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66177 samples/s/p 1:30:10 } +2024-07-30 04:38:58,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2423/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 3.7698403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:38:58,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65891 samples/s/p 1:30:10 } +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2425/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.7664922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:00,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65992 samples/s/p 1:30:06 } +2024-07-30 04:39:03,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2427/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.7631446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:03,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.65922 samples/s/p 1:30:04 } +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2429/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 3.7597963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:06,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.66048 samples/s/p 1:30:00 } +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2431/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.7564498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:09,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65912 samples/s/p 1:29:58 } +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2433/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 3.753104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:12,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65567 samples/s/p 1:29:59 } +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2435/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 3.7497582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:15,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.66090 samples/s/p 1:29:51 } +2024-07-30 04:39:17,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2437/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.7464135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:17,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65987 samples/s/p 1:29:49 } +2024-07-30 04:39:20,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2439/ 3125], loss: 0.328, per_step_time: 1415ms, lr: 3.7430698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:20,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.65223 samples/s/p 1:29:53 } +2024-07-30 04:39:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2441/ 3125], loss: 0.256, per_step_time: 1414ms, lr: 3.7397258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65705 samples/s/p 1:29:46 } +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2443/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.736382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:26,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.66081 samples/s/p 1:29:40 } +2024-07-30 04:39:29,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2445/ 3125], loss: 0.225, per_step_time: 1414ms, lr: 3.73304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:29,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65646 samples/s/p 1:29:41 } +2024-07-30 04:39:32,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2447/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.7296977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:32,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.65152 samples/s/p 1:29:43 } +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2449/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 3.7263565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:34,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65824 samples/s/p 1:29:34 } +2024-07-30 04:39:37,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2451/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 3.7230163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:37,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66012 samples/s/p 1:29:29 } +2024-07-30 04:39:40,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2453/ 3125], loss: 0.315, per_step_time: 1414ms, lr: 3.7196764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:40,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65751 samples/s/p 1:29:29 } +2024-07-30 04:39:43,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2455/ 3125], loss: 0.526, per_step_time: 1413ms, lr: 3.7163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:43,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.65970 samples/s/p 1:29:24 } +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2457/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 3.712998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:46,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.66020 samples/s/p 1:29:20 } +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2459/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.7096588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66206 samples/s/p 1:29:16 } +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2461/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.7063216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:51,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66086 samples/s/p 1:29:14 } +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2463/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 3.7029847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:54,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66009 samples/s/p 1:29:12 } +2024-07-30 04:39:57,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2465/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.6996487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:39:57,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66001 samples/s/p 1:29:09 } +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2467/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.6963124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:00,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.66002 samples/s/p 1:29:06 } +2024-07-30 04:40:03,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2469/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.6929775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:03,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.65932 samples/s/p 1:29:04 } +2024-07-30 04:40:06,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2471/ 3125], loss: 0.391, per_step_time: 1412ms, lr: 3.6896433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:06,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66252 samples/s/p 1:28:58 } +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2473/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 3.6863087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.65835 samples/s/p 1:29:00 } +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2475/ 3125], loss: 0.343, per_step_time: 1412ms, lr: 3.6829756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:11,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.66218 samples/s/p 1:28:53 } +2024-07-30 04:40:11,714 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2477/ 3125], loss: 0.064, per_step_time: 1413ms, lr: 3.6796432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:46,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66104 samples/s/p 1:28:51 } +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2479/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.676311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:49,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65805 samples/s/p 1:28:51 } +2024-07-30 04:40:51,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2481/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 3.67298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:51,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66177 samples/s/p 1:28:45 } +2024-07-30 04:40:54,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2483/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 3.6696492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:54,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.66139 samples/s/p 1:28:43 } +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2485/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6663198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:40:57,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.65134 samples/s/p 1:28:49 } +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2487/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.662989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:00,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.66071 samples/s/p 1:28:38 } +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2489/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.6596607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:03,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.66118 samples/s/p 1:28:34 } +2024-07-30 04:41:06,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2491/ 3125], loss: 0.308, per_step_time: 1415ms, lr: 3.6563322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:06,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65000 samples/s/p 1:28:42 } +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2493/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 3.6530046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:08,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65846 samples/s/p 1:28:31 } +2024-07-30 04:41:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2495/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 3.649678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:11,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.65927 samples/s/p 1:28:28 } +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2497/ 3125], loss: 0.399, per_step_time: 1415ms, lr: 3.6463523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:14,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65000 samples/s/p 1:28:33 } +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2499/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 3.6430263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:17,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.65721 samples/s/p 1:28:24 } +2024-07-30 04:41:20,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2501/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.639701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:20,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65984 samples/s/p 1:28:19 } +2024-07-30 04:41:23,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2503/ 3125], loss: 0.176, per_step_time: 1414ms, lr: 3.6363765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.65746 samples/s/p 1:28:18 } +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2505/ 3125], loss: 0.574, per_step_time: 1424ms, lr: 3.633053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:25,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.61472 samples/s/p 1:28:55 } +2024-07-30 04:41:28,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2507/ 3125], loss: 0.181, per_step_time: 1415ms, lr: 3.6297301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:28,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65256 samples/s/p 1:28:17 } +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2509/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 3.6264082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65586 samples/s/p 1:28:11 } +2024-07-30 04:41:34,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2511/ 3125], loss: 0.570, per_step_time: 1414ms, lr: 3.623086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:34,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.65446 samples/s/p 1:28:09 } +2024-07-30 04:41:37,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2513/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.6197655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:37,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.66163 samples/s/p 1:28:00 } +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2515/ 3125], loss: 0.619, per_step_time: 1413ms, lr: 3.616444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:40,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65919 samples/s/p 1:27:59 } +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2517/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 3.6131246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:42,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65499 samples/s/p 1:28:00 } +2024-07-30 04:41:45,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2519/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 3.6098056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:45,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.65601 samples/s/p 1:27:57 } +2024-07-30 04:41:48,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2521/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 3.6064878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:48,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.66029 samples/s/p 1:27:50 } +2024-07-30 04:41:51,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2523/ 3125], loss: 0.164, per_step_time: 1429ms, lr: 3.6031697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:51,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.59668 samples/s/p 1:28:47 } +2024-07-30 04:41:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2525/ 3125], loss: 0.048, per_step_time: 1413ms, lr: 3.5998528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66106 samples/s/p 1:27:44 } +2024-07-30 04:41:57,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2527/ 3125], loss: 0.453, per_step_time: 1414ms, lr: 3.5965368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:41:57,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65553 samples/s/p 1:27:46 } +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2529/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.5932212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:00,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.65824 samples/s/p 1:27:41 } +2024-07-30 04:42:02,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2531/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 3.5899054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:02,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.66022 samples/s/p 1:27:36 } +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2533/ 3125], loss: 0.200, per_step_time: 1414ms, lr: 3.5865914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:05,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65482 samples/s/p 1:27:38 } +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2535/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.5832775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:08,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65943 samples/s/p 1:27:31 } +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2537/ 3125], loss: 0.054, per_step_time: 1413ms, lr: 3.5799646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65928 samples/s/p 1:27:28 } +2024-07-30 04:42:14,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2539/ 3125], loss: 0.462, per_step_time: 1413ms, lr: 3.5766523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:14,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.65861 samples/s/p 1:27:26 } +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2541/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 3.573341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:17,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.66149 samples/s/p 1:27:21 } +2024-07-30 04:42:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2543/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 3.5700302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:19,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65654 samples/s/p 1:27:22 } +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2545/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 3.5667192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:22,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65768 samples/s/p 1:27:18 } +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2547/ 3125], loss: 0.118, per_step_time: 1415ms, lr: 3.563409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:25,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65358 samples/s/p 1:27:19 } +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2549/ 3125], loss: 0.230, per_step_time: 1414ms, lr: 3.5601004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.65728 samples/s/p 1:27:13 } +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2551/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 3.5567923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.66210 samples/s/p 1:27:06 } +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2553/ 3125], loss: 0.078, per_step_time: 1414ms, lr: 3.5534852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:34,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65533 samples/s/p 1:27:09 } +2024-07-30 04:42:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2555/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 3.5501782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65457 samples/s/p 1:27:07 } +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2557/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.546872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:39,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.65979 samples/s/p 1:26:59 } +2024-07-30 04:42:42,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2559/ 3125], loss: 0.431, per_step_time: 1413ms, lr: 3.5435658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:42,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.66066 samples/s/p 1:26:56 } +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2561/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 3.5402613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:45,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66157 samples/s/p 1:26:52 } +2024-07-30 04:42:48,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2563/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 3.5369574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:48,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65913 samples/s/p 1:26:52 } +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2565/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.533654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:51,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66104 samples/s/p 1:26:47 } +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2567/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 3.5303517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:53,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.66015 samples/s/p 1:26:45 } +2024-07-30 04:42:56,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2569/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 3.5270493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:56,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.65962 samples/s/p 1:26:43 } +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2571/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 3.5237483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:42:59,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.66075 samples/s/p 1:26:39 } +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2573/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.5204469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65809 samples/s/p 1:26:38 } +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2575/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 3.5171472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65511 samples/s/p 1:26:38 } +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2577/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 3.5138485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65973 samples/s/p 1:26:31 } +2024-07-30 04:43:10,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2579/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 3.5105502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:10,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.65944 samples/s/p 1:26:29 } +2024-07-30 04:43:13,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2581/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 3.5072524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:13,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65931 samples/s/p 1:26:26 } +2024-07-30 04:43:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2583/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 3.5039554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.66125 samples/s/p 1:26:21 } +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2585/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.5006594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:19,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65842 samples/s/p 1:26:21 } +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2587/ 3125], loss: 0.173, per_step_time: 1415ms, lr: 3.4973639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:22,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65350 samples/s/p 1:26:23 } +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2589/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4940683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:25,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.65974 samples/s/p 1:26:14 } +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2591/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 3.4907746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:27,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.66143 samples/s/p 1:26:10 } +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2593/ 3125], loss: 0.070, per_step_time: 1414ms, lr: 3.4874804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:30,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65435 samples/s/p 1:26:14 } +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2595/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 3.4841883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:33,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65745 samples/s/p 1:26:08 } +2024-07-30 04:43:36,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2597/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 3.4808963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:36,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.65656 samples/s/p 1:26:06 } +2024-07-30 04:43:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2599/ 3125], loss: 0.383, per_step_time: 1414ms, lr: 3.4776056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65528 samples/s/p 1:26:04 } +2024-07-30 04:43:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2601/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 3.4743143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:42,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65731 samples/s/p 1:26:00 } +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2603/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 3.4710242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:44,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.66166 samples/s/p 1:25:53 } +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2605/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 3.467735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:47,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.65932 samples/s/p 1:25:52 } +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2607/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 3.4644468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.66034 samples/s/p 1:25:48 } +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2609/ 3125], loss: 0.295, per_step_time: 1414ms, lr: 3.4611594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:53,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65736 samples/s/p 1:25:48 } +2024-07-30 04:43:56,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2611/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 3.4578727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:56,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66128 samples/s/p 1:25:42 } +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2613/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.4545865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:43:59,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65847 samples/s/p 1:25:42 } +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2615/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.4513014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:01,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.66133 samples/s/p 1:25:36 } +2024-07-30 04:44:04,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2617/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 3.4480156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:04,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.65989 samples/s/p 1:25:35 } +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2619/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 3.444732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:07,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65647 samples/s/p 1:25:35 } +2024-07-30 04:44:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2621/ 3125], loss: 0.879, per_step_time: 1413ms, lr: 3.4414493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65854 samples/s/p 1:25:30 } +2024-07-30 04:44:13,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2623/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 3.438167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:13,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.65169 samples/s/p 1:25:34 } +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2625/ 3125], loss: 0.056, per_step_time: 1417ms, lr: 3.434885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.64345 samples/s/p 1:25:38 } +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2627/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.4316042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:18,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65975 samples/s/p 1:25:21 } +2024-07-30 04:44:21,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2629/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 3.4283244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:21,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66197 samples/s/p 1:25:16 } +2024-07-30 04:44:24,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2631/ 3125], loss: 0.300, per_step_time: 1412ms, lr: 3.4250438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:24,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66224 samples/s/p 1:25:13 } +2024-07-30 04:44:27,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2633/ 3125], loss: 0.124, per_step_time: 1415ms, lr: 3.4217655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:27,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.65162 samples/s/p 1:25:19 } +2024-07-30 04:44:30,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2635/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 3.4184877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:30,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.66283 samples/s/p 1:25:06 } +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2637/ 3125], loss: 0.199, per_step_time: 1414ms, lr: 3.4152101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:33,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65714 samples/s/p 1:25:09 } +2024-07-30 04:44:35,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2639/ 3125], loss: 0.533, per_step_time: 1413ms, lr: 3.4119344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:35,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66089 samples/s/p 1:25:03 } +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2641/ 3125], loss: 0.310, per_step_time: 1415ms, lr: 3.4086588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:38,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65280 samples/s/p 1:25:07 } +2024-07-30 04:44:41,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2643/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 3.405384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:41,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.65973 samples/s/p 1:24:58 } +2024-07-30 04:44:44,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2645/ 3125], loss: 0.170, per_step_time: 1412ms, lr: 3.402109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:44,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.66322 samples/s/p 1:24:52 } +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2647/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 3.3988356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:47,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65851 samples/s/p 1:24:53 } +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2649/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3955628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:50,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65999 samples/s/p 1:24:49 } +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2651/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 3.3922913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:52,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.65988 samples/s/p 1:24:47 } +2024-07-30 04:44:55,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2653/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.3890205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.66121 samples/s/p 1:24:43 } +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2655/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 3.3857502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:44:58,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65455 samples/s/p 1:24:46 } +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2657/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 3.3824806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65803 samples/s/p 1:24:40 } +2024-07-30 04:45:04,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2659/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.3792119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:04,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.66032 samples/s/p 1:24:35 } +2024-07-30 04:45:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2661/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 3.3759432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:07,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.66094 samples/s/p 1:24:31 } +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2663/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.3726762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:09,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.65830 samples/s/p 1:24:31 } +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2665/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 3.36941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:12,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65997 samples/s/p 1:24:27 } +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2667/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 3.3661445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65836 samples/s/p 1:24:25 } +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2669/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 3.3628792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:18,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.65796 samples/s/p 1:24:23 } +2024-07-30 04:45:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2671/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 3.3596154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66037 samples/s/p 1:24:18 } +2024-07-30 04:45:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2673/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 3.3563524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.66122 samples/s/p 1:24:14 } +2024-07-30 04:45:26,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2675/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 3.353089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66105 samples/s/p 1:24:12 } +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2677/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 3.3498275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65869 samples/s/p 1:24:11 } +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2679/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.3465665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.65808 samples/s/p 1:24:09 } +2024-07-30 04:45:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2681/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 3.3433062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.66092 samples/s/p 1:24:03 } +2024-07-30 04:45:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2683/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 3.340047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65916 samples/s/p 1:24:02 } +2024-07-30 04:45:41,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2685/ 3125], loss: 0.134, per_step_time: 1414ms, lr: 3.3367887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:41,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.65520 samples/s/p 1:24:03 } +2024-07-30 04:45:43,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2687/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.333531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:43,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.66129 samples/s/p 1:23:54 } +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2689/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 3.3302733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:46,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66155 samples/s/p 1:23:51 } +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2691/ 3125], loss: 0.316, per_step_time: 1412ms, lr: 3.3270173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:49,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.66242 samples/s/p 1:23:48 } +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2693/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 3.3237618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65910 samples/s/p 1:23:48 } +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2695/ 3125], loss: 0.215, per_step_time: 1416ms, lr: 3.3205074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:55,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.64721 samples/s/p 1:23:56 } +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2697/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.3172535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:45:58,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65902 samples/s/p 1:23:42 } +2024-07-30 04:46:00,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2699/ 3125], loss: 0.429, per_step_time: 1413ms, lr: 3.3140009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:00,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.66049 samples/s/p 1:23:38 } +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2701/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.3107483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.65924 samples/s/p 1:23:36 } +2024-07-30 04:46:06,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2703/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.3074969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:06,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65806 samples/s/p 1:23:35 } +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2705/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 3.3042456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:09,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.66008 samples/s/p 1:23:30 } +2024-07-30 04:46:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2707/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 3.3009962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65910 samples/s/p 1:23:28 } +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2709/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 3.2977473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:15,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.65419 samples/s/p 1:23:30 } +2024-07-30 04:46:17,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2711/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 3.2944995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:17,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65562 samples/s/p 1:23:25 } +2024-07-30 04:46:20,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2713/ 3125], loss: 0.175, per_step_time: 1415ms, lr: 3.291252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:20,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.65062 samples/s/p 1:23:27 } +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2715/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2880055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:23,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66054 samples/s/p 1:23:15 } +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2717/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 3.2847588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:26,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66150 samples/s/p 1:23:12 } +2024-07-30 04:46:29,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2719/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 3.2815146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:29,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.66078 samples/s/p 1:23:10 } +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2721/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 3.2782705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:32,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66088 samples/s/p 1:23:07 } +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2723/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 3.275028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:35,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65893 samples/s/p 1:23:06 } +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2725/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 3.2717846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:37,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66041 samples/s/p 1:23:01 } +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2727/ 3125], loss: 0.052, per_step_time: 1413ms, lr: 3.2685434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:40,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.66114 samples/s/p 1:22:58 } +2024-07-30 04:46:43,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2729/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 3.265303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:43,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.65866 samples/s/p 1:22:57 } +2024-07-30 04:46:46,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2731/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2620633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.66100 samples/s/p 1:22:52 } +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2733/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 3.2588234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:49,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65925 samples/s/p 1:22:51 } +2024-07-30 04:46:52,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2735/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.2555854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:52,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65802 samples/s/p 1:22:49 } +2024-07-30 04:46:54,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2737/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 3.2523476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:54,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.65692 samples/s/p 1:22:48 } +2024-07-30 04:46:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2739/ 3125], loss: 0.217, per_step_time: 1428ms, lr: 3.2491112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:46:57,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.60096 samples/s/p 1:23:34 } +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2741/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.2458759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:00,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.65987 samples/s/p 1:22:39 } +2024-07-30 04:47:03,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2743/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 3.242641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:03,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66029 samples/s/p 1:22:36 } +2024-07-30 04:47:06,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2745/ 3125], loss: 0.425, per_step_time: 1413ms, lr: 3.2394066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:06,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66111 samples/s/p 1:22:33 } +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2747/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 3.236173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:09,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.66067 samples/s/p 1:22:30 } +2024-07-30 04:47:11,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2749/ 3125], loss: 0.331, per_step_time: 1413ms, lr: 3.2329403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66094 samples/s/p 1:22:27 } +2024-07-30 04:47:14,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2751/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.2297091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:14,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.66123 samples/s/p 1:22:24 } +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2753/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 3.2264786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:17,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65884 samples/s/p 1:22:23 } +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2755/ 3125], loss: 0.465, per_step_time: 1413ms, lr: 3.2232485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:20,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65899 samples/s/p 1:22:20 } +2024-07-30 04:47:23,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2757/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 3.2200196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:23,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.65959 samples/s/p 1:22:17 } +2024-07-30 04:47:26,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2759/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 3.2167916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:26,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.66151 samples/s/p 1:22:12 } +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2761/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 3.2135636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:28,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65639 samples/s/p 1:22:14 } +2024-07-30 04:47:31,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2763/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.2103371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:31,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65829 samples/s/p 1:22:10 } +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2765/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.2071118e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65830 samples/s/p 1:22:07 } +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2767/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 3.2038872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:37,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.65960 samples/s/p 1:22:03 } +2024-07-30 04:47:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2769/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.200663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.66076 samples/s/p 1:21:59 } +2024-07-30 04:47:43,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2771/ 3125], loss: 0.446, per_step_time: 1413ms, lr: 3.1974405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.66061 samples/s/p 1:21:56 } +2024-07-30 04:47:45,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2773/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 3.1942182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:45,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65780 samples/s/p 1:21:56 } +2024-07-30 04:47:48,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2775/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 3.190996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:48,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.65736 samples/s/p 1:21:53 } +2024-07-30 04:47:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2777/ 3125], loss: 0.291, per_step_time: 1415ms, lr: 3.1877757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:51,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.65209 samples/s/p 1:21:55 } +2024-07-30 04:47:54,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2779/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 3.1845566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66182 samples/s/p 1:21:44 } +2024-07-30 04:47:57,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2781/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 3.1813377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:47:57,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66008 samples/s/p 1:21:43 } +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2783/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 3.1781199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:00,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66179 samples/s/p 1:21:38 } +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2785/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 3.1749032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.66021 samples/s/p 1:21:37 } +2024-07-30 04:48:05,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2787/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.171687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:05,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66042 samples/s/p 1:21:34 } +2024-07-30 04:48:08,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2789/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1684717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:08,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66089 samples/s/p 1:21:31 } +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2791/ 3125], loss: 0.480, per_step_time: 1413ms, lr: 3.1652569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:11,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.66040 samples/s/p 1:21:28 } +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2793/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 3.162043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:14,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65989 samples/s/p 1:21:26 } +2024-07-30 04:48:17,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2795/ 3125], loss: 0.254, per_step_time: 1413ms, lr: 3.1588309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:17,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.65940 samples/s/p 1:21:23 } +2024-07-30 04:48:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2797/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 3.1556194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:19,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66113 samples/s/p 1:21:19 } +2024-07-30 04:48:22,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2799/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.152409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65990 samples/s/p 1:21:17 } +2024-07-30 04:48:25,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2801/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 3.1491986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:25,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.66089 samples/s/p 1:21:14 } +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2803/ 3125], loss: 0.385, per_step_time: 1414ms, lr: 3.1459897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:28,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.65516 samples/s/p 1:21:16 } +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2805/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 3.1427805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:31,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66156 samples/s/p 1:21:07 } +2024-07-30 04:48:34,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2807/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 3.1395732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:34,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66016 samples/s/p 1:21:06 } +2024-07-30 04:48:36,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2809/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.136367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:36,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65472 samples/s/p 1:21:08 } +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2811/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 3.133162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:39,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.66035 samples/s/p 1:21:00 } +2024-07-30 04:48:42,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2813/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 3.1299573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:42,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.65887 samples/s/p 1:20:58 } +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2815/ 3125], loss: 0.597, per_step_time: 1413ms, lr: 3.1267534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:45,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65850 samples/s/p 1:20:56 } +2024-07-30 04:48:48,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2817/ 3125], loss: 0.322, per_step_time: 1415ms, lr: 3.1235509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:48,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65225 samples/s/p 1:20:58 } +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2819/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 3.1203479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:51,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.65779 samples/s/p 1:20:51 } +2024-07-30 04:48:53,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2821/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 3.1171471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:53,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.66103 samples/s/p 1:20:45 } +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2823/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 3.1139475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:56,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.66115 samples/s/p 1:20:42 } +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2825/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 3.110748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:48:59,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66166 samples/s/p 1:20:39 } +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2827/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 3.1075494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:02,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66093 samples/s/p 1:20:37 } +2024-07-30 04:49:05,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2829/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 3.1043523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:05,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.66056 samples/s/p 1:20:34 } +2024-07-30 04:49:08,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2831/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 3.1011564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:08,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.65975 samples/s/p 1:20:32 } +2024-07-30 04:49:10,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2833/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.0979597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:10,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.65780 samples/s/p 1:20:31 } +2024-07-30 04:49:13,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2835/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 3.094765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.65479 samples/s/p 1:20:31 } +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2837/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 3.0915708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:16,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66200 samples/s/p 1:20:22 } +2024-07-30 04:49:19,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2839/ 3125], loss: 0.136, per_step_time: 1413ms, lr: 3.0883782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:19,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66125 samples/s/p 1:20:20 } +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2841/ 3125], loss: 0.094, per_step_time: 1412ms, lr: 3.0851863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:22,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.66242 samples/s/p 1:20:16 } +2024-07-30 04:49:25,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2843/ 3125], loss: 0.482, per_step_time: 1416ms, lr: 3.0819954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:25,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.64817 samples/s/p 1:20:25 } +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2845/ 3125], loss: 0.384, per_step_time: 1415ms, lr: 3.0788058e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65110 samples/s/p 1:20:20 } +2024-07-30 04:49:30,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2847/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 3.0756155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:30,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65862 samples/s/p 1:20:11 } +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2849/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 3.0724268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:33,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65972 samples/s/p 1:20:07 } +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2851/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 3.0692397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.65779 samples/s/p 1:20:06 } +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2853/ 3125], loss: 0.544, per_step_time: 1413ms, lr: 3.0660533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:39,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.65948 samples/s/p 1:20:01 } +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2855/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 3.062868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:42,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66153 samples/s/p 1:19:57 } +2024-07-30 04:49:44,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2857/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 3.0596836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:44,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66012 samples/s/p 1:19:55 } +2024-07-30 04:49:47,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2859/ 3125], loss: 0.194, per_step_time: 1412ms, lr: 3.0564995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:47,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.66176 samples/s/p 1:19:51 } +2024-07-30 04:49:50,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2861/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.053317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:50,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.65994 samples/s/p 1:19:50 } +2024-07-30 04:49:53,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2863/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 3.0501344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66097 samples/s/p 1:19:46 } +2024-07-30 04:49:56,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2865/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 3.0469537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:56,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66196 samples/s/p 1:19:42 } +2024-07-30 04:49:59,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2867/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 3.0437736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:49:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66087 samples/s/p 1:19:40 } +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2869/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.040595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:01,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.66112 samples/s/p 1:19:37 } +2024-07-30 04:50:04,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2871/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 3.0374165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:04,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65794 samples/s/p 1:19:37 } +2024-07-30 04:50:07,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2873/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 3.0342396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:07,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.65380 samples/s/p 1:19:38 } +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2875/ 3125], loss: 0.374, per_step_time: 1412ms, lr: 3.0310637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:10,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.66267 samples/s/p 1:19:28 } +2024-07-30 04:50:13,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2877/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 3.0278873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:13,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.65689 samples/s/p 1:19:30 } +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2879/ 3125], loss: 0.043, per_step_time: 1419ms, lr: 3.0247134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:16,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.63664 samples/s/p 1:19:44 } +2024-07-30 04:50:18,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2881/ 3125], loss: 0.512, per_step_time: 1413ms, lr: 3.02154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:18,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66085 samples/s/p 1:19:21 } +2024-07-30 04:50:21,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2883/ 3125], loss: 0.264, per_step_time: 1412ms, lr: 3.0183671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:21,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66180 samples/s/p 1:19:17 } +2024-07-30 04:50:24,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2885/ 3125], loss: 0.169, per_step_time: 1414ms, lr: 3.015196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:24,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.65695 samples/s/p 1:19:18 } +2024-07-30 04:50:27,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2887/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 3.012026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:27,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66001 samples/s/p 1:19:13 } +2024-07-30 04:50:30,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2889/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 3.008856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:30,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.66164 samples/s/p 1:19:09 } +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2891/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 3.0056867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:33,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66088 samples/s/p 1:19:06 } +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2893/ 3125], loss: 0.385, per_step_time: 1412ms, lr: 3.0025187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:35,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66225 samples/s/p 1:19:02 } +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2895/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.999352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:38,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.66080 samples/s/p 1:19:01 } +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2897/ 3125], loss: 0.212, per_step_time: 1413ms, lr: 2.9961866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:41,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.65854 samples/s/p 1:19:00 } +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2899/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 2.9930218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:44,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66049 samples/s/p 1:18:55 } +2024-07-30 04:50:47,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2901/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.9898583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:47,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66023 samples/s/p 1:18:53 } +2024-07-30 04:50:50,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2903/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 2.9866949e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:50,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65758 samples/s/p 1:18:52 } +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2905/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 2.9835319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:52,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.66037 samples/s/p 1:18:47 } +2024-07-30 04:50:55,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2907/ 3125], loss: 0.115, per_step_time: 1414ms, lr: 2.980371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.65613 samples/s/p 1:18:48 } +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2909/ 3125], loss: 0.178, per_step_time: 1413ms, lr: 2.9772114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:50:58,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65868 samples/s/p 1:18:43 } +2024-07-30 04:51:01,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2911/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.9740524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:01,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65993 samples/s/p 1:18:39 } +2024-07-30 04:51:04,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2913/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.9708945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:04,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65773 samples/s/p 1:18:38 } +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2915/ 3125], loss: 0.250, per_step_time: 1412ms, lr: 2.9677371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:07,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.66193 samples/s/p 1:18:32 } +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2917/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 2.9645812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:09,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.65996 samples/s/p 1:18:30 } +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2919/ 3125], loss: 0.264, per_step_time: 1415ms, lr: 2.961425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65347 samples/s/p 1:18:33 } +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2921/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.958271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:15,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65760 samples/s/p 1:18:27 } +2024-07-30 04:51:18,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2923/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.9551177e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:18,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.65849 samples/s/p 1:18:23 } +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2925/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9519658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.66232 samples/s/p 1:18:17 } +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2927/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.9488142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:24,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66078 samples/s/p 1:18:16 } +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2929/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.9456642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:26,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66181 samples/s/p 1:18:12 } +2024-07-30 04:51:29,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2931/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 2.942515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:29,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.66026 samples/s/p 1:18:10 } +2024-07-30 04:51:32,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2933/ 3125], loss: 0.302, per_step_time: 1414ms, lr: 2.9393668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:32,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65747 samples/s/p 1:18:10 } +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2935/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 2.9362188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.65918 samples/s/p 1:18:06 } +2024-07-30 04:51:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2937/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 2.9330724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:38,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66066 samples/s/p 1:18:02 } +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2939/ 3125], loss: 0.116, per_step_time: 1413ms, lr: 2.9299267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:41,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66129 samples/s/p 1:17:58 } +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2941/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 2.9267826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:43,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65777 samples/s/p 1:17:58 } +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2943/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.9236394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:46,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.65957 samples/s/p 1:17:54 } +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2945/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.920497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:49,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.66134 samples/s/p 1:17:50 } +2024-07-30 04:51:52,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2947/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.917356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:52,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65790 samples/s/p 1:17:50 } +2024-07-30 04:51:55,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2949/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 2.9142147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:55,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65953 samples/s/p 1:17:46 } +2024-07-30 04:51:58,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2951/ 3125], loss: 0.022, per_step_time: 1412ms, lr: 2.9110752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:51:58,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.66259 samples/s/p 1:17:40 } +2024-07-30 04:52:00,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2953/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 2.9079372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:00,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.65738 samples/s/p 1:17:42 } +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2955/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 2.904799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:03,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66270 samples/s/p 1:17:35 } +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2957/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.9016626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:06,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66068 samples/s/p 1:17:33 } +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2959/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 2.8985273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:09,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.65844 samples/s/p 1:17:32 } +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2961/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.8953932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:12,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66152 samples/s/p 1:17:27 } +2024-07-30 04:52:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2963/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.8922586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.66010 samples/s/p 1:17:25 } +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2965/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.8891266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:17,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65982 samples/s/p 1:17:23 } +2024-07-30 04:52:20,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2967/ 3125], loss: 0.358, per_step_time: 1414ms, lr: 2.8859954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:20,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65698 samples/s/p 1:17:22 } +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2969/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.882865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:23,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66120 samples/s/p 1:17:16 } +2024-07-30 04:52:26,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2971/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 2.8797358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:26,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.66044 samples/s/p 1:17:14 } +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2973/ 3125], loss: 0.339, per_step_time: 1414ms, lr: 2.8766076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:29,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.65618 samples/s/p 1:17:14 } +2024-07-30 04:52:32,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2975/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 2.8734794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:32,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65727 samples/s/p 1:17:11 } +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2977/ 3125], loss: 0.048, per_step_time: 1415ms, lr: 2.8703535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:34,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65298 samples/s/p 1:17:11 } +2024-07-30 04:52:37,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2979/ 3125], loss: 0.607, per_step_time: 1414ms, lr: 2.867227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:37,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65631 samples/s/p 1:17:06 } +2024-07-30 04:52:40,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2981/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 2.864103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:40,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.65964 samples/s/p 1:17:00 } +2024-07-30 04:52:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2983/ 3125], loss: 0.097, per_step_time: 1413ms, lr: 2.86098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:43,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66132 samples/s/p 1:16:56 } +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2985/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 2.857858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:46,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66314 samples/s/p 1:16:52 } +2024-07-30 04:52:49,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2987/ 3125], loss: 0.051, per_step_time: 1413ms, lr: 2.8547367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:49,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66121 samples/s/p 1:16:51 } +2024-07-30 04:52:52,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2989/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 2.8516167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:52,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66060 samples/s/p 1:16:48 } +2024-07-30 04:52:54,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2991/ 3125], loss: 0.142, per_step_time: 1412ms, lr: 2.8484965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:54,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.66201 samples/s/p 1:16:44 } +2024-07-30 04:52:57,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2993/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.8453785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:52:57,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65833 samples/s/p 1:16:44 } +2024-07-30 04:53:00,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2995/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 2.8422617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:00,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65173 samples/s/p 1:16:47 } +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2997/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.8391455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:03,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65842 samples/s/p 1:16:39 } +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 2999/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 2.8360298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:06,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65882 samples/s/p 1:16:36 } +2024-07-30 04:53:09,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3001/ 3125], loss: 0.242, per_step_time: 1414ms, lr: 2.832916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:09,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.65444 samples/s/p 1:16:36 } +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3003/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 2.8298032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:11,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65862 samples/s/p 1:16:30 } +2024-07-30 04:53:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3005/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.8266911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:14,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65821 samples/s/p 1:16:28 } +2024-07-30 04:53:17,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3007/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.8235793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:17,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.65912 samples/s/p 1:16:24 } +2024-07-30 04:53:20,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3009/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.8204697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:20,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.66126 samples/s/p 1:16:19 } +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3011/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.817361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66100 samples/s/p 1:16:17 } +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3013/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.8142535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65873 samples/s/p 1:16:16 } +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3015/ 3125], loss: 0.209, per_step_time: 1412ms, lr: 2.811147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:28,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.66173 samples/s/p 1:16:11 } +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3017/ 3125], loss: 0.380, per_step_time: 1417ms, lr: 2.8080415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:31,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.64391 samples/s/p 1:16:22 } +2024-07-30 04:53:34,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3019/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 2.8049358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:34,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.65891 samples/s/p 1:16:07 } +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3021/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 2.8018326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:37,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65839 samples/s/p 1:16:05 } +2024-07-30 04:53:40,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3023/ 3125], loss: 0.125, per_step_time: 1413ms, lr: 2.798729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:40,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65910 samples/s/p 1:16:01 } +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3025/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.7956276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:43,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.66021 samples/s/p 1:15:58 } +2024-07-30 04:53:45,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3027/ 3125], loss: 0.122, per_step_time: 1413ms, lr: 2.7925273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:45,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65816 samples/s/p 1:15:56 } +2024-07-30 04:53:48,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3029/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 2.7894282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:48,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.65834 samples/s/p 1:15:53 } +2024-07-30 04:53:51,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3031/ 3125], loss: 0.483, per_step_time: 1414ms, lr: 2.78633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:51,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65580 samples/s/p 1:15:53 } +2024-07-30 04:53:54,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3033/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 2.783233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:54,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65697 samples/s/p 1:15:49 } +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3035/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.7801354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:53:57,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.66013 samples/s/p 1:15:44 } +2024-07-30 04:54:00,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3037/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 2.7770404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:00,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.65153 samples/s/p 1:15:48 } +2024-07-30 04:54:02,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3039/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.7739466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:02,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.66133 samples/s/p 1:15:37 } +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3041/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.7708536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:05,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.65844 samples/s/p 1:15:36 } +2024-07-30 04:54:08,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3043/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.7677606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:08,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66115 samples/s/p 1:15:31 } +2024-07-30 04:54:11,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3045/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 2.7646702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:11,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66145 samples/s/p 1:15:28 } +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3047/ 3125], loss: 0.335, per_step_time: 1413ms, lr: 2.7615804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:14,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.66022 samples/s/p 1:15:27 } +2024-07-30 04:54:17,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3049/ 3125], loss: 0.182, per_step_time: 1412ms, lr: 2.7584906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:17,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66229 samples/s/p 1:15:22 } +2024-07-30 04:54:19,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3051/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 2.755403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:19,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.66145 samples/s/p 1:15:20 } +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3053/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.7523165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:22,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65947 samples/s/p 1:15:19 } +2024-07-30 04:54:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3055/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.7492315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:25,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65918 samples/s/p 1:15:16 } +2024-07-30 04:54:28,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3057/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 2.746147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:28,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.65664 samples/s/p 1:15:15 } +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3059/ 3125], loss: 0.276, per_step_time: 1412ms, lr: 2.7430635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:31,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.66272 samples/s/p 1:15:08 } +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3061/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 2.7399817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:34,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.65782 samples/s/p 1:15:09 } +2024-07-30 04:54:36,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3063/ 3125], loss: 0.301, per_step_time: 1414ms, lr: 2.7368992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:36,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65597 samples/s/p 1:15:07 } +2024-07-30 04:54:39,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3065/ 3125], loss: 0.355, per_step_time: 1414ms, lr: 2.7338194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:39,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65375 samples/s/p 1:15:06 } +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3067/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.7307394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:42,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.65851 samples/s/p 1:15:00 } +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3069/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 2.7276617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:45,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66143 samples/s/p 1:14:54 } +2024-07-30 04:54:48,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3071/ 3125], loss: 0.504, per_step_time: 1413ms, lr: 2.7245849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:48,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65828 samples/s/p 1:14:54 } +2024-07-30 04:54:51,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3073/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.7215092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:51,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.65963 samples/s/p 1:14:50 } +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3075/ 3125], loss: 0.285, per_step_time: 1412ms, lr: 2.7184346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:53,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.66176 samples/s/p 1:14:46 } +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3077/ 3125], loss: 0.393, per_step_time: 1413ms, lr: 2.715361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:56,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65936 samples/s/p 1:14:45 } +2024-07-30 04:54:59,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3079/ 3125], loss: 0.137, per_step_time: 1414ms, lr: 2.7122876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:54:59,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65405 samples/s/p 1:14:46 } +2024-07-30 04:55:02,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3081/ 3125], loss: 0.499, per_step_time: 1413ms, lr: 2.709216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:02,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66051 samples/s/p 1:14:38 } +2024-07-30 04:55:05,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3083/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.7061462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:05,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.65599 samples/s/p 1:14:39 } +2024-07-30 04:55:08,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3085/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.7030771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:08,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.66144 samples/s/p 1:14:32 } +2024-07-30 04:55:10,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3087/ 3125], loss: 0.280, per_step_time: 1415ms, lr: 2.7000078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:10,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65101 samples/s/p 1:14:37 } +2024-07-30 04:55:13,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3089/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6969408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:13,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65937 samples/s/p 1:14:28 } +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3091/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.6938749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:16,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66057 samples/s/p 1:14:24 } +2024-07-30 04:55:19,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3093/ 3125], loss: 0.408, per_step_time: 1413ms, lr: 2.6908092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:19,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.65817 samples/s/p 1:14:23 } +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3095/ 3125], loss: 0.365, per_step_time: 1412ms, lr: 2.6877456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:22,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.66247 samples/s/p 1:14:17 } +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3097/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.684683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65995 samples/s/p 1:14:16 } +2024-07-30 04:55:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3099/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.6816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65997 samples/s/p 1:14:13 } +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3101/ 3125], loss: 0.268, per_step_time: 1412ms, lr: 2.678561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:30,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.66181 samples/s/p 1:14:09 } +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3103/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.6755022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:33,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.65845 samples/s/p 1:14:09 } +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3105/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 2.672444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:36,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66139 samples/s/p 1:14:04 } +2024-07-30 04:55:39,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3107/ 3125], loss: 0.395, per_step_time: 1414ms, lr: 2.6693863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:39,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65765 samples/s/p 1:14:04 } +2024-07-30 04:55:42,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3109/ 3125], loss: 0.345, per_step_time: 1412ms, lr: 2.6663304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:42,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66287 samples/s/p 1:13:57 } +2024-07-30 04:55:44,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3111/ 3125], loss: 0.186, per_step_time: 1412ms, lr: 2.6632742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:44,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.66172 samples/s/p 1:13:55 } +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3113/ 3125], loss: 0.202, per_step_time: 1415ms, lr: 2.6602208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.65196 samples/s/p 1:14:00 } +2024-07-30 04:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3115/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 2.6571681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65675 samples/s/p 1:13:53 } +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3117/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 2.6541168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:53,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65831 samples/s/p 1:13:49 } +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3119/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 2.6510663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:56,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65964 samples/s/p 1:13:45 } +2024-07-30 04:55:59,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3121/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 2.648016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:55:59,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.66164 samples/s/p 1:13:41 } +2024-07-30 04:56:01,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3123/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.644968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:01,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.65946 samples/s/p 1:13:40 } +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 3], step:[ 3125/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 2.641921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:04,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.66059 samples/s/p 1:13:36 } +2024-07-30 04:56:07,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.6388755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:07,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65800 samples/s/p 1:13:35 } +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 4/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 2.6358305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:10,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65690 samples/s/p 1:13:33 } +2024-07-30 04:56:13,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 6/ 3125], loss: 0.401, per_step_time: 1413ms, lr: 2.632786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:13,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.65878 samples/s/p 1:13:29 } +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 8/ 3125], loss: 0.274, per_step_time: 1412ms, lr: 2.6297437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:16,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.66185 samples/s/p 1:13:24 } +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 10/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6267028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:18,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65572 samples/s/p 1:13:26 } +2024-07-30 04:56:21,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 12/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6236612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:21,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65701 samples/s/p 1:13:22 } +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 14/ 3125], loss: 0.251, per_step_time: 1414ms, lr: 2.6206224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:24,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65405 samples/s/p 1:13:21 } +2024-07-30 04:56:27,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 16/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 2.6175844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:27,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.65431 samples/s/p 1:13:18 } +2024-07-30 04:56:30,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 18/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 2.6145476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:30,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66116 samples/s/p 1:13:10 } +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 20/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.6115122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:33,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65875 samples/s/p 1:13:09 } +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 22/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.6084776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65975 samples/s/p 1:13:06 } +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 24/ 3125], loss: 0.292, per_step_time: 1413ms, lr: 2.6054445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:38,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.65972 samples/s/p 1:13:03 } +2024-07-30 04:56:41,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 26/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 2.6024115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.66040 samples/s/p 1:12:59 } +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 28/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 2.5993802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:44,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.65988 samples/s/p 1:12:57 } +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 30/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:47,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66149 samples/s/p 1:12:53 } +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 32/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.5933205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66032 samples/s/p 1:12:51 } +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 34/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 2.5902932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:52,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.66184 samples/s/p 1:12:47 } +2024-07-30 04:56:55,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 36/ 3125], loss: 0.366, per_step_time: 1412ms, lr: 2.5872669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:55,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66200 samples/s/p 1:12:44 } +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 38/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 2.5842417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:56:58,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66038 samples/s/p 1:12:42 } +2024-07-30 04:57:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 40/ 3125], loss: 0.229, per_step_time: 1412ms, lr: 2.581216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:01,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.66266 samples/s/p 1:12:38 } +2024-07-30 04:57:04,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 42/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 2.5781935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:04,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65948 samples/s/p 1:12:37 } +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 44/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 2.5751715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:07,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.65987 samples/s/p 1:12:34 } +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 46/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.5721508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:09,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66158 samples/s/p 1:12:30 } +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 48/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 2.569131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:12,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.65723 samples/s/p 1:12:31 } +2024-07-30 04:57:15,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 50/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 2.5661127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:15,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66075 samples/s/p 1:12:25 } +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 52/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 2.5630948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:18,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66067 samples/s/p 1:12:22 } +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 54/ 3125], loss: 0.313, per_step_time: 1412ms, lr: 2.5600777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:21,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.66183 samples/s/p 1:12:19 } +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 56/ 3125], loss: 0.199, per_step_time: 1413ms, lr: 2.557063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:24,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65905 samples/s/p 1:12:18 } +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 58/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.5540494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:26,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65977 samples/s/p 1:12:15 } +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 60/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 2.5510367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:29,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66059 samples/s/p 1:12:11 } +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 62/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 2.5480251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:32,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.65916 samples/s/p 1:12:09 } +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 64/ 3125], loss: 0.206, per_step_time: 1412ms, lr: 2.5450151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:35,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.66239 samples/s/p 1:12:04 } +2024-07-30 04:57:38,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 66/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.5420063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:38,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65873 samples/s/p 1:12:04 } +2024-07-30 04:57:41,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 68/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 2.5389975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:41,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66137 samples/s/p 1:11:59 } +2024-07-30 04:57:43,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 70/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 2.5359905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.66163 samples/s/p 1:11:56 } +2024-07-30 04:57:46,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 72/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 2.532985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:46,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.65494 samples/s/p 1:11:59 } +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 74/ 3125], loss: 0.082, per_step_time: 1413ms, lr: 2.529981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:49,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.66116 samples/s/p 1:11:51 } +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 76/ 3125], loss: 0.412, per_step_time: 1414ms, lr: 2.5269765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:52,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65650 samples/s/p 1:11:52 } +2024-07-30 04:57:55,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 78/ 3125], loss: 0.093, per_step_time: 1414ms, lr: 2.5239747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:55,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65721 samples/s/p 1:11:48 } +2024-07-30 04:57:58,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 80/ 3125], loss: 0.102, per_step_time: 1412ms, lr: 2.5209742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:57:58,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.66274 samples/s/p 1:11:41 } +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 82/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 2.5179743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:00,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.65472 samples/s/p 1:11:45 } +2024-07-30 04:58:03,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 84/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 2.514975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:03,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66226 samples/s/p 1:11:36 } +2024-07-30 04:58:06,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 86/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.5119778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:06,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66074 samples/s/p 1:11:34 } +2024-07-30 04:58:09,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 88/ 3125], loss: 0.132, per_step_time: 1414ms, lr: 2.5089817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65575 samples/s/p 1:11:35 } +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 90/ 3125], loss: 0.296, per_step_time: 1414ms, lr: 2.505987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:12,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.65454 samples/s/p 1:11:33 } +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 92/ 3125], loss: 0.289, per_step_time: 1412ms, lr: 2.5029933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:15,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.66236 samples/s/p 1:11:25 } +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 94/ 3125], loss: 0.059, per_step_time: 1413ms, lr: 2.5000008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:18,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65853 samples/s/p 1:11:25 } +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 96/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 2.4970086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:20,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.65549 samples/s/p 1:11:24 } +2024-07-30 04:58:23,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 98/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 2.4940175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:23,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66165 samples/s/p 1:11:17 } +2024-07-30 04:58:26,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 100/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.4910285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:26,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.66168 samples/s/p 1:11:14 } +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 102/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.4880408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:29,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66119 samples/s/p 1:11:11 } +2024-07-30 04:58:32,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 104/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 2.4850544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:32,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65578 samples/s/p 1:11:13 } +2024-07-30 04:58:35,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 106/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.4820695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:35,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65860 samples/s/p 1:11:08 } +2024-07-30 04:58:37,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 108/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4790852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:37,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.65867 samples/s/p 1:11:05 } +2024-07-30 04:58:40,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 110/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4761023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:40,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.66134 samples/s/p 1:11:00 } +2024-07-30 04:58:43,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 112/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 2.4731198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:43,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65755 samples/s/p 1:11:00 } +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 114/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.4701392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:46,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.65989 samples/s/p 1:10:55 } +2024-07-30 04:58:49,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 116/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 2.46716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:49,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66095 samples/s/p 1:10:52 } +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 118/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 2.464182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:52,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66035 samples/s/p 1:10:49 } +2024-07-30 04:58:54,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 120/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 2.461204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:54,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.66097 samples/s/p 1:10:46 } +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 122/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 2.4582287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:58:57,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.66014 samples/s/p 1:10:44 } +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 124/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 2.4552542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.65930 samples/s/p 1:10:42 } +2024-07-30 04:59:03,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 126/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.45228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:03,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.66063 samples/s/p 1:10:38 } +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 128/ 3125], loss: 0.396, per_step_time: 1415ms, lr: 2.4493079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:06,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.65287 samples/s/p 1:10:41 } +2024-07-30 04:59:09,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 130/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 2.4463372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:09,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66073 samples/s/p 1:10:32 } +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 132/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 2.4433677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:11,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66016 samples/s/p 1:10:30 } +2024-07-30 04:59:14,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 134/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.4403994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:14,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.66006 samples/s/p 1:10:27 } +2024-07-30 04:59:17,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 136/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 2.4374324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:17,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65984 samples/s/p 1:10:24 } +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 138/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.4344665e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:20,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.65901 samples/s/p 1:10:22 } +2024-07-30 04:59:23,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 140/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 2.431501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:23,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65743 samples/s/p 1:10:21 } +2024-07-30 04:59:26,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 142/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 2.4285375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:26,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66103 samples/s/p 1:10:15 } +2024-07-30 04:59:28,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 144/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 2.4255744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:28,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66146 samples/s/p 1:10:12 } +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 146/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.422613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:31,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.66107 samples/s/p 1:10:09 } +2024-07-30 04:59:34,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 148/ 3125], loss: 0.408, per_step_time: 1414ms, lr: 2.4196536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:34,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.65444 samples/s/p 1:10:11 } +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 150/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 2.416695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:37,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.65933 samples/s/p 1:10:05 } +2024-07-30 04:59:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 152/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.413738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:40,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66022 samples/s/p 1:10:01 } +2024-07-30 04:59:43,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 154/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 2.410782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:43,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66025 samples/s/p 1:09:59 } +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 156/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 2.407826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:45,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.66050 samples/s/p 1:09:56 } +2024-07-30 04:59:48,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 158/ 3125], loss: 0.271, per_step_time: 1419ms, lr: 2.4048725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:48,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.63649 samples/s/p 1:10:11 } +2024-07-30 04:59:51,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 160/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.4019203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:51,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65981 samples/s/p 1:09:50 } +2024-07-30 04:59:54,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 162/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3989692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:54,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65959 samples/s/p 1:09:48 } +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 164/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 2.396018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 04:59:57,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.66141 samples/s/p 1:09:44 } +2024-07-30 05:00:00,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 166/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.3930697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:00,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.65877 samples/s/p 1:09:43 } +2024-07-30 05:00:02,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 168/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.3901223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:02,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65870 samples/s/p 1:09:40 } +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 170/ 3125], loss: 0.350, per_step_time: 1416ms, lr: 2.3871753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:05,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.64606 samples/s/p 1:09:46 } +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 172/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.3842304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:08,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65964 samples/s/p 1:09:34 } +2024-07-30 05:00:11,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 174/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.3812868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:11,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.66069 samples/s/p 1:09:30 } +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 176/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.3783446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:14,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.65877 samples/s/p 1:09:29 } +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 178/ 3125], loss: 0.348, per_step_time: 1414ms, lr: 2.3754033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:17,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65729 samples/s/p 1:09:27 } +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 180/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 2.3724635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:19,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65785 samples/s/p 1:09:24 } +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 182/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 2.369525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:22,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65713 samples/s/p 1:09:21 } +2024-07-30 05:00:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 184/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 2.3665866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.65611 samples/s/p 1:09:19 } +2024-07-30 05:00:28,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 186/ 3125], loss: 0.228, per_step_time: 1414ms, lr: 2.3636508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:28,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65765 samples/s/p 1:09:15 } +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 188/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 2.360715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:31,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66102 samples/s/p 1:09:10 } +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 190/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 2.357781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:34,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66166 samples/s/p 1:09:07 } +2024-07-30 05:00:36,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 192/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.354849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:36,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.66025 samples/s/p 1:09:05 } +2024-07-30 05:00:39,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 194/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 2.3519178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:39,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.65916 samples/s/p 1:09:03 } +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 196/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 2.348988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:42,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66048 samples/s/p 1:08:59 } +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 198/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.3460586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:45,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66180 samples/s/p 1:08:55 } +2024-07-30 05:00:48,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 200/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 2.3431312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:48,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.66092 samples/s/p 1:08:53 } +2024-07-30 05:00:51,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 202/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 2.3402056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:51,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65955 samples/s/p 1:08:51 } +2024-07-30 05:00:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 204/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 2.3372806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:53,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.65925 samples/s/p 1:08:49 } +2024-07-30 05:00:56,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 206/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 2.3343575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:56,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66157 samples/s/p 1:08:44 } +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 208/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.3314344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:00:59,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66096 samples/s/p 1:08:42 } +2024-07-30 05:01:02,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 210/ 3125], loss: 0.288, per_step_time: 1412ms, lr: 2.3285136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:02,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66177 samples/s/p 1:08:38 } +2024-07-30 05:01:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 212/ 3125], loss: 0.287, per_step_time: 1417ms, lr: 2.3255939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.64573 samples/s/p 1:08:47 } +2024-07-30 05:01:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 214/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 2.3226744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:08,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.66005 samples/s/p 1:08:34 } +2024-07-30 05:01:10,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 216/ 3125], loss: 0.241, per_step_time: 1416ms, lr: 2.3197572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:10,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.64774 samples/s/p 1:08:40 } +2024-07-30 05:01:13,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 218/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 2.3168413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:13,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.66095 samples/s/p 1:08:28 } +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 220/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 2.313927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:16,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65918 samples/s/p 1:08:26 } +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 222/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 2.311014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:19,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.65897 samples/s/p 1:08:23 } +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 224/ 3125], loss: 0.213, per_step_time: 1412ms, lr: 2.3081018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66207 samples/s/p 1:08:18 } +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 226/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.3051914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:25,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.65962 samples/s/p 1:08:17 } +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 228/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3022812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:27,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.65966 samples/s/p 1:08:14 } +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 230/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 2.2993727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:30,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66136 samples/s/p 1:08:10 } +2024-07-30 05:01:33,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 232/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.2964653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:33,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.66069 samples/s/p 1:08:08 } +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 234/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.2935599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65394 samples/s/p 1:08:10 } +2024-07-30 05:01:39,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 236/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 2.2906556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:39,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66087 samples/s/p 1:08:02 } +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 238/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 2.287753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:42,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65981 samples/s/p 1:08:00 } +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 240/ 3125], loss: 0.195, per_step_time: 1413ms, lr: 2.284851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:44,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.66146 samples/s/p 1:07:56 } +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 242/ 3125], loss: 0.152, per_step_time: 1414ms, lr: 2.2819497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:47,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.65508 samples/s/p 1:07:58 } +2024-07-30 05:01:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 244/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 2.279051e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65649 samples/s/p 1:07:54 } +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 246/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 2.2761533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:53,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66105 samples/s/p 1:07:48 } +2024-07-30 05:01:56,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 248/ 3125], loss: 0.120, per_step_time: 1414ms, lr: 2.2732568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:56,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.65625 samples/s/p 1:07:49 } +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 250/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 2.2703616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:01:59,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.66014 samples/s/p 1:07:43 } +2024-07-30 05:02:01,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 252/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 2.2674667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:01,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66038 samples/s/p 1:07:40 } +2024-07-30 05:02:04,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 254/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 2.2645745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:04,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66004 samples/s/p 1:07:37 } +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 256/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 2.261682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:07,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.65823 samples/s/p 1:07:36 } +2024-07-30 05:02:10,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 258/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 2.2587922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:10,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66000 samples/s/p 1:07:32 } +2024-07-30 05:02:13,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 260/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2559038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:13,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.66167 samples/s/p 1:07:28 } +2024-07-30 05:02:16,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 262/ 3125], loss: 0.442, per_step_time: 1414ms, lr: 2.2530164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:16,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65405 samples/s/p 1:07:30 } +2024-07-30 05:02:18,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 264/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 2.2501304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:18,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65832 samples/s/p 1:07:25 } +2024-07-30 05:02:21,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 266/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 2.247246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:21,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66111 samples/s/p 1:07:20 } +2024-07-30 05:02:24,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 268/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 2.2443626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:24,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.65674 samples/s/p 1:07:20 } +2024-07-30 05:02:27,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 270/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 2.2414795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:27,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.66007 samples/s/p 1:07:15 } +2024-07-30 05:02:30,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 272/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 2.2385987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:30,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.65976 samples/s/p 1:07:12 } +2024-07-30 05:02:33,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 274/ 3125], loss: 0.139, per_step_time: 1413ms, lr: 2.2357194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:33,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66159 samples/s/p 1:07:08 } +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 276/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.2328406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66036 samples/s/p 1:07:06 } +2024-07-30 05:02:38,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 278/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 2.2299637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:38,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.66018 samples/s/p 1:07:03 } +2024-07-30 05:02:41,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 280/ 3125], loss: 0.103, per_step_time: 1412ms, lr: 2.2270885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66317 samples/s/p 1:06:58 } +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 282/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 2.2242143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:44,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66013 samples/s/p 1:06:58 } +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 284/ 3125], loss: 0.123, per_step_time: 1413ms, lr: 2.2213417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66031 samples/s/p 1:06:55 } +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 286/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.218469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:50,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66060 samples/s/p 1:06:52 } +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 288/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 2.2155987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:52,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.66166 samples/s/p 1:06:48 } +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 290/ 3125], loss: 0.319, per_step_time: 1415ms, lr: 2.21273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:55,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65368 samples/s/p 1:06:51 } +2024-07-30 05:02:58,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 292/ 3125], loss: 0.234, per_step_time: 1414ms, lr: 2.2098627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:02:58,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65607 samples/s/p 1:06:47 } +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 294/ 3125], loss: 0.413, per_step_time: 1413ms, lr: 2.2069967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:01,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66110 samples/s/p 1:06:40 } +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 296/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 2.2041309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:04,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.66249 samples/s/p 1:06:36 } +2024-07-30 05:03:07,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 298/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.2012675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:07,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.65903 samples/s/p 1:06:36 } +2024-07-30 05:03:09,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 300/ 3125], loss: 0.222, per_step_time: 1412ms, lr: 2.1984042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:09,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66223 samples/s/p 1:06:31 } +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 302/ 3125], loss: 0.172, per_step_time: 1412ms, lr: 2.1955436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:12,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.66214 samples/s/p 1:06:28 } +2024-07-30 05:03:15,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 304/ 3125], loss: 0.106, per_step_time: 1413ms, lr: 2.192684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:15,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.65876 samples/s/p 1:06:28 } +2024-07-30 05:03:18,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 306/ 3125], loss: 0.305, per_step_time: 1416ms, lr: 2.189826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:18,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.64759 samples/s/p 1:06:33 } +2024-07-30 05:03:21,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 308/ 3125], loss: 0.250, per_step_time: 1412ms, lr: 2.1869691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:21,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66180 samples/s/p 1:06:20 } +2024-07-30 05:03:24,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 310/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 2.1841138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:24,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.66104 samples/s/p 1:06:18 } +2024-07-30 05:03:26,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 312/ 3125], loss: 0.106, per_step_time: 1414ms, lr: 2.18126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:26,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.65624 samples/s/p 1:06:18 } +2024-07-30 05:03:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 314/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 2.178406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:29,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65877 samples/s/p 1:06:14 } +2024-07-30 05:03:32,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 316/ 3125], loss: 0.227, per_step_time: 1414ms, lr: 2.175555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:32,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.65755 samples/s/p 1:06:12 } +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 318/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 2.1727046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66062 samples/s/p 1:06:07 } +2024-07-30 05:03:38,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 320/ 3125], loss: 0.451, per_step_time: 1412ms, lr: 2.1698552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:38,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.66192 samples/s/p 1:06:03 } +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 322/ 3125], loss: 0.272, per_step_time: 1414ms, lr: 2.1670078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:41,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65636 samples/s/p 1:06:04 } +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 324/ 3125], loss: 0.444, per_step_time: 1413ms, lr: 2.1641617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:43,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65989 samples/s/p 1:05:59 } +2024-07-30 05:03:46,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 326/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.161317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.65833 samples/s/p 1:05:57 } +2024-07-30 05:03:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 328/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 2.158473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:49,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66124 samples/s/p 1:05:52 } +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 330/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 2.1556311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:52,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66420 samples/s/p 1:05:47 } +2024-07-30 05:03:55,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 332/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.1527903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:55,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66036 samples/s/p 1:05:47 } +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 334/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.1499513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:03:58,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.66064 samples/s/p 1:05:44 } +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 336/ 3125], loss: 0.485, per_step_time: 1413ms, lr: 2.1471137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:00,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66065 samples/s/p 1:05:41 } +2024-07-30 05:04:03,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 338/ 3125], loss: 0.426, per_step_time: 1413ms, lr: 2.144277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:03,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65877 samples/s/p 1:05:40 } +2024-07-30 05:04:06,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 340/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 2.141441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:06,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65916 samples/s/p 1:05:36 } +2024-07-30 05:04:09,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 342/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.1386072e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:09,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.66203 samples/s/p 1:05:32 } +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 344/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 2.135774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:12,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.65874 samples/s/p 1:05:31 } +2024-07-30 05:04:15,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 346/ 3125], loss: 0.262, per_step_time: 1414ms, lr: 2.1329429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:15,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65659 samples/s/p 1:05:30 } +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 348/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 2.1301134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:17,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65553 samples/s/p 1:05:28 } +2024-07-30 05:04:20,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 350/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 2.127285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:20,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.65891 samples/s/p 1:05:23 } +2024-07-30 05:04:23,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 352/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 2.1244582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66080 samples/s/p 1:05:18 } +2024-07-30 05:04:26,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 354/ 3125], loss: 0.058, per_step_time: 1413ms, lr: 2.1216326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:26,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.66004 samples/s/p 1:05:16 } +2024-07-30 05:04:29,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 356/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 2.1188087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:29,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66082 samples/s/p 1:05:13 } +2024-07-30 05:04:32,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 358/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 2.115985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:32,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65983 samples/s/p 1:05:11 } +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 360/ 3125], loss: 0.197, per_step_time: 1413ms, lr: 2.1131634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:34,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.66077 samples/s/p 1:05:07 } +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 362/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 2.1103435e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:37,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.65942 samples/s/p 1:05:05 } +2024-07-30 05:04:40,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 364/ 3125], loss: 0.402, per_step_time: 1425ms, lr: 2.1075239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.61074 samples/s/p 1:05:36 } +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 366/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 2.1047065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:43,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66255 samples/s/p 1:04:57 } +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 368/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.1018907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:46,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66059 samples/s/p 1:04:56 } +2024-07-30 05:04:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 370/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.0990763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66073 samples/s/p 1:04:53 } +2024-07-30 05:04:51,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 372/ 3125], loss: 0.299, per_step_time: 1412ms, lr: 2.0962623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:51,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.66232 samples/s/p 1:04:49 } +2024-07-30 05:04:54,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 374/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.0934503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:54,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66098 samples/s/p 1:04:47 } +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 376/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 2.09064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:04:57,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65942 samples/s/p 1:04:45 } +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 378/ 3125], loss: 0.187, per_step_time: 1412ms, lr: 2.087831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:00,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.66215 samples/s/p 1:04:41 } +2024-07-30 05:05:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 380/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 2.0850239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:03,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65828 samples/s/p 1:04:41 } +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 382/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 2.0822176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:06,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.65982 samples/s/p 1:04:37 } +2024-07-30 05:05:08,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 384/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.079413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:08,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65975 samples/s/p 1:04:34 } +2024-07-30 05:05:11,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 386/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 2.076608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65800 samples/s/p 1:04:32 } +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 388/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 2.0738055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:14,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65786 samples/s/p 1:04:30 } +2024-07-30 05:05:17,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 390/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 2.0710047e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:17,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.66105 samples/s/p 1:04:25 } +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 392/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 2.0682057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:20,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.65589 samples/s/p 1:04:25 } +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 394/ 3125], loss: 0.306, per_step_time: 1416ms, lr: 2.065408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:23,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.64821 samples/s/p 1:04:28 } +2024-07-30 05:05:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 396/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 2.0626114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65934 samples/s/p 1:04:17 } +2024-07-30 05:05:28,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 398/ 3125], loss: 0.328, per_step_time: 1414ms, lr: 2.0598168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:28,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.65735 samples/s/p 1:04:16 } +2024-07-30 05:05:31,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 400/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 2.0570221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:31,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.66013 samples/s/p 1:04:11 } +2024-07-30 05:05:34,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 402/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 2.05423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:34,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66163 samples/s/p 1:04:07 } +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 404/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 2.051439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:37,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66195 samples/s/p 1:04:04 } +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 406/ 3125], loss: 0.152, per_step_time: 1412ms, lr: 2.0486498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:40,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66223 samples/s/p 1:04:01 } +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 408/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 2.0458617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:43,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66129 samples/s/p 1:03:59 } +2024-07-30 05:05:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 410/ 3125], loss: 0.260, per_step_time: 1412ms, lr: 2.0430743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.66263 samples/s/p 1:03:55 } +2024-07-30 05:05:48,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 412/ 3125], loss: 0.390, per_step_time: 1415ms, lr: 2.0402892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:48,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65319 samples/s/p 1:03:59 } +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 414/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 2.0375046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:51,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66068 samples/s/p 1:03:51 } +2024-07-30 05:05:54,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 416/ 3125], loss: 0.178, per_step_time: 1412ms, lr: 2.0347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:54,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66215 samples/s/p 1:03:47 } +2024-07-30 05:05:57,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 418/ 3125], loss: 0.521, per_step_time: 1414ms, lr: 2.0319414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:05:57,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.65765 samples/s/p 1:03:47 } +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 420/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.029162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:00,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.66064 samples/s/p 1:03:42 } +2024-07-30 05:06:02,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 422/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.0263842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:02,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.66049 samples/s/p 1:03:40 } +2024-07-30 05:06:05,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 424/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 2.023607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:05,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65891 samples/s/p 1:03:38 } +2024-07-30 05:06:08,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 426/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 2.0208322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:08,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65931 samples/s/p 1:03:35 } +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 428/ 3125], loss: 0.118, per_step_time: 1413ms, lr: 2.0180582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.65825 samples/s/p 1:03:33 } +2024-07-30 05:06:14,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 430/ 3125], loss: 0.393, per_step_time: 1414ms, lr: 2.0152852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:14,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65721 samples/s/p 1:03:31 } +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 432/ 3125], loss: 0.254, per_step_time: 1415ms, lr: 2.0125142e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:17,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.65208 samples/s/p 1:03:31 } +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 434/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 2.0097436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:19,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66113 samples/s/p 1:03:22 } +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 436/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 2.0069756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:22,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66177 samples/s/p 1:03:19 } +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 438/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 2.0042091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.66164 samples/s/p 1:03:16 } +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 440/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 2.0014438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:28,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65699 samples/s/p 1:03:17 } +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 442/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.9986799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65572 samples/s/p 1:03:15 } +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 444/ 3125], loss: 0.249, per_step_time: 1414ms, lr: 1.9959166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:34,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65680 samples/s/p 1:03:11 } +2024-07-30 05:06:36,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 446/ 3125], loss: 0.138, per_step_time: 1412ms, lr: 1.9931558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:36,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.66173 samples/s/p 1:03:05 } +2024-07-30 05:06:39,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 448/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.9903964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:39,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.65953 samples/s/p 1:03:04 } +2024-07-30 05:06:42,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 450/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.9876384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:42,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66131 samples/s/p 1:03:00 } +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 452/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 1.9848817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:45,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66235 samples/s/p 1:02:56 } +2024-07-30 05:06:48,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 454/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 1.9821257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:48,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66037 samples/s/p 1:02:55 } +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 456/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.9793717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:51,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.66042 samples/s/p 1:02:52 } +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 458/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.9766185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:53,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65926 samples/s/p 1:02:50 } +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 460/ 3125], loss: 0.338, per_step_time: 1415ms, lr: 1.9738677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:56,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65258 samples/s/p 1:02:51 } +2024-07-30 05:06:59,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 462/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.9711183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:06:59,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65834 samples/s/p 1:02:45 } +2024-07-30 05:07:02,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 464/ 3125], loss: 0.441, per_step_time: 1413ms, lr: 1.9683703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65872 samples/s/p 1:02:41 } +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 466/ 3125], loss: 0.331, per_step_time: 1414ms, lr: 1.965624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:05,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.65711 samples/s/p 1:02:40 } +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 468/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.962879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:08,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65925 samples/s/p 1:02:35 } +2024-07-30 05:07:10,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 470/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.9601353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:10,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65849 samples/s/p 1:02:33 } +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 472/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 1.9573924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:13,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.65942 samples/s/p 1:02:30 } +2024-07-30 05:07:16,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 474/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.9546515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:16,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66130 samples/s/p 1:02:26 } +2024-07-30 05:07:19,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 476/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.9519123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:19,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.66131 samples/s/p 1:02:23 } +2024-07-30 05:07:22,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 478/ 3125], loss: 0.275, per_step_time: 1412ms, lr: 1.9491736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:22,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66305 samples/s/p 1:02:19 } +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 480/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 1.9464371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:25,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66281 samples/s/p 1:02:16 } +2024-07-30 05:07:27,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 482/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 1.9437023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.66053 samples/s/p 1:02:15 } +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 484/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.9409688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:30,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.65874 samples/s/p 1:02:13 } +2024-07-30 05:07:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 486/ 3125], loss: 0.109, per_step_time: 1412ms, lr: 1.938237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66234 samples/s/p 1:02:08 } +2024-07-30 05:07:36,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 488/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 1.9355055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:36,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65969 samples/s/p 1:02:07 } +2024-07-30 05:07:39,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 490/ 3125], loss: 0.378, per_step_time: 1412ms, lr: 1.9327765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:39,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66283 samples/s/p 1:02:02 } +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 492/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.930049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:42,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.66047 samples/s/p 1:02:01 } +2024-07-30 05:07:44,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 494/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.9273227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:44,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.65856 samples/s/p 1:01:59 } +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 496/ 3125], loss: 0.438, per_step_time: 1413ms, lr: 1.924598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:47,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65953 samples/s/p 1:01:56 } +2024-07-30 05:07:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 498/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.9218742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:50,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.65863 samples/s/p 1:01:53 } +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 500/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 1.9191523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:53,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.66027 samples/s/p 1:01:50 } +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 502/ 3125], loss: 0.083, per_step_time: 1415ms, lr: 1.916431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:56,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65364 samples/s/p 1:01:51 } +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 504/ 3125], loss: 0.214, per_step_time: 1414ms, lr: 1.9137126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:07:59,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.65672 samples/s/p 1:01:46 } +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 506/ 3125], loss: 0.513, per_step_time: 1413ms, lr: 1.9109953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:01,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65778 samples/s/p 1:01:43 } +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 508/ 3125], loss: 0.122, per_step_time: 1418ms, lr: 1.9082795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:04,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.63839 samples/s/p 1:01:53 } +2024-07-30 05:08:07,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 510/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 1.9055652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:07,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66027 samples/s/p 1:01:35 } +2024-07-30 05:08:10,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 512/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9028523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:10,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.65917 samples/s/p 1:01:33 } +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 514/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.9001409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:13,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.66084 samples/s/p 1:01:29 } +2024-07-30 05:08:16,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 516/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.89743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65982 samples/s/p 1:01:27 } +2024-07-30 05:08:18,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 518/ 3125], loss: 0.083, per_step_time: 1414ms, lr: 1.8947217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:18,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65635 samples/s/p 1:01:27 } +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 520/ 3125], loss: 0.139, per_step_time: 1412ms, lr: 1.8920147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:21,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.66414 samples/s/p 1:01:19 } +2024-07-30 05:08:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 522/ 3125], loss: 0.269, per_step_time: 1414ms, lr: 1.8893084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:24,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.65700 samples/s/p 1:01:21 } +2024-07-30 05:08:27,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 524/ 3125], loss: 0.303, per_step_time: 1413ms, lr: 1.8866044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:27,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65978 samples/s/p 1:01:16 } +2024-07-30 05:08:30,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 526/ 3125], loss: 0.138, per_step_time: 1414ms, lr: 1.8839019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:30,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65724 samples/s/p 1:01:15 } +2024-07-30 05:08:33,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 528/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 1.8812009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65961 samples/s/p 1:01:10 } +2024-07-30 05:08:35,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 530/ 3125], loss: 0.005, per_step_time: 1412ms, lr: 1.8785005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:35,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.66272 samples/s/p 1:01:06 } +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 532/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 1.8758026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.65997 samples/s/p 1:01:05 } +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 534/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.873106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:41,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66168 samples/s/p 1:01:01 } +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 536/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 1.870411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:44,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65916 samples/s/p 1:00:59 } +2024-07-30 05:08:47,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 538/ 3125], loss: 0.510, per_step_time: 1413ms, lr: 1.8677174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:47,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66044 samples/s/p 1:00:56 } +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 540/ 3125], loss: 0.125, per_step_time: 1414ms, lr: 1.8650254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.65534 samples/s/p 1:00:56 } +2024-07-30 05:08:52,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 542/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.862334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:52,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.66026 samples/s/p 1:00:50 } +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 544/ 3125], loss: 0.156, per_step_time: 1412ms, lr: 1.859645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:55,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66207 samples/s/p 1:00:46 } +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 546/ 3125], loss: 0.244, per_step_time: 1412ms, lr: 1.8569565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:08:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66177 samples/s/p 1:00:44 } +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 548/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 1.8542704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:01,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66119 samples/s/p 1:00:41 } +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 550/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 1.8515858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:04,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.66126 samples/s/p 1:00:38 } +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 552/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 1.8489027e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:07,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66135 samples/s/p 1:00:35 } +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 554/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 1.8462214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:09,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66039 samples/s/p 1:00:33 } +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 556/ 3125], loss: 0.197, per_step_time: 1412ms, lr: 1.8435412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:12,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.66184 samples/s/p 1:00:29 } +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 558/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.8408629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:15,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65970 samples/s/p 1:00:28 } +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 560/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 1.8381849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:18,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.65668 samples/s/p 1:00:27 } +2024-07-30 05:09:21,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 562/ 3125], loss: 0.268, per_step_time: 1416ms, lr: 1.8355095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:21,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.64605 samples/s/p 1:00:31 } +2024-07-30 05:09:24,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 564/ 3125], loss: 0.274, per_step_time: 1413ms, lr: 1.8328357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:24,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65964 samples/s/p 1:00:20 } +2024-07-30 05:09:26,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 566/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 1.8301621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:26,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66186 samples/s/p 1:00:15 } +2024-07-30 05:09:29,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 568/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 1.8274911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:29,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.65965 samples/s/p 1:00:14 } +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 570/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 1.8248218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:32,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.66163 samples/s/p 1:00:10 } +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 572/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 1.8221535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:35,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65749 samples/s/p 1:00:10 } +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 574/ 3125], loss: 0.064, per_step_time: 1414ms, lr: 1.8194863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:38,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65758 samples/s/p 1:00:07 } +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 576/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 1.8168216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:41,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65749 samples/s/p 1:00:04 } +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 578/ 3125], loss: 0.265, per_step_time: 1415ms, lr: 1.8141582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:43,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.65331 samples/s/p 1:00:04 } +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 580/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.8114963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:46,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65979 samples/s/p 0:59:57 } +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 582/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.8088361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:49,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65999 samples/s/p 0:59:54 } +2024-07-30 05:09:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 584/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.8061771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66020 samples/s/p 0:59:51 } +2024-07-30 05:09:55,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 586/ 3125], loss: 0.202, per_step_time: 1414ms, lr: 1.8035188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:55,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.65604 samples/s/p 0:59:51 } +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 588/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.8008631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:09:58,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.66035 samples/s/p 0:59:45 } +2024-07-30 05:10:00,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 590/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.798208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:00,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65241 samples/s/p 0:59:47 } +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 592/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 1.7955554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65786 samples/s/p 0:59:41 } +2024-07-30 05:10:06,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 594/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.7929044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.65951 samples/s/p 0:59:37 } +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 596/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 1.7902544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:09,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66173 samples/s/p 0:59:33 } +2024-07-30 05:10:12,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 598/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 1.7876064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:12,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.66105 samples/s/p 0:59:31 } +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 600/ 3125], loss: 0.395, per_step_time: 1413ms, lr: 1.7849596e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:15,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.66020 samples/s/p 0:59:28 } +2024-07-30 05:10:17,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 602/ 3125], loss: 0.266, per_step_time: 1414ms, lr: 1.7823138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:17,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65665 samples/s/p 0:59:28 } +2024-07-30 05:10:20,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 604/ 3125], loss: 0.134, per_step_time: 1413ms, lr: 1.7796704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:20,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65891 samples/s/p 0:59:23 } +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 606/ 3125], loss: 0.142, per_step_time: 1413ms, lr: 1.7770287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:23,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.65882 samples/s/p 0:59:21 } +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 608/ 3125], loss: 0.591, per_step_time: 1413ms, lr: 1.7743882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:26,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65920 samples/s/p 0:59:18 } +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 610/ 3125], loss: 0.108, per_step_time: 1414ms, lr: 1.771748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:29,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65724 samples/s/p 0:59:16 } +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 612/ 3125], loss: 0.229, per_step_time: 1415ms, lr: 1.7691108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:32,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65224 samples/s/p 0:59:16 } +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 614/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 1.7664751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:34,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.66099 samples/s/p 0:59:08 } +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 616/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.7638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:37,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.65888 samples/s/p 0:59:06 } +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 618/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.7612073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:40,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.65805 samples/s/p 0:59:04 } +2024-07-30 05:10:43,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 620/ 3125], loss: 0.065, per_step_time: 1412ms, lr: 1.758576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:43,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66243 samples/s/p 0:58:59 } +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 622/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 1.7559465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:46,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66190 samples/s/p 0:58:56 } +2024-07-30 05:10:49,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 624/ 3125], loss: 0.520, per_step_time: 1413ms, lr: 1.7533185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:49,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.66023 samples/s/p 0:58:54 } +2024-07-30 05:10:51,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 626/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 1.750692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:51,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.65983 samples/s/p 0:58:52 } +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 628/ 3125], loss: 0.372, per_step_time: 1412ms, lr: 1.7480671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:54,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.66175 samples/s/p 0:58:48 } +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 630/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.7454427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:10:57,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65939 samples/s/p 0:58:46 } +2024-07-30 05:11:00,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 632/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 1.7428207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:00,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65258 samples/s/p 0:58:48 } +2024-07-30 05:11:03,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 634/ 3125], loss: 0.278, per_step_time: 1415ms, lr: 1.7401995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:03,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.65151 samples/s/p 0:58:46 } +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 636/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.7375809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:06,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66187 samples/s/p 0:58:36 } +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 638/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.7349636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:08,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.65979 samples/s/p 0:58:35 } +2024-07-30 05:11:11,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 640/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 1.7323479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:11,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66160 samples/s/p 0:58:31 } +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 642/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.7297339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:14,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66116 samples/s/p 0:58:28 } +2024-07-30 05:11:17,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 644/ 3125], loss: 0.400, per_step_time: 1413ms, lr: 1.7271215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:17,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.66030 samples/s/p 0:58:26 } +2024-07-30 05:11:20,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 646/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 1.7245095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:20,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66191 samples/s/p 0:58:22 } +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 648/ 3125], loss: 0.312, per_step_time: 1413ms, lr: 1.7219004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:23,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65949 samples/s/p 0:58:21 } +2024-07-30 05:11:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 650/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7192924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:25,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65932 samples/s/p 0:58:18 } +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 652/ 3125], loss: 0.326, per_step_time: 1414ms, lr: 1.7166861e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:28,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.65444 samples/s/p 0:58:18 } +2024-07-30 05:11:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 654/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.7140806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.66048 samples/s/p 0:58:12 } +2024-07-30 05:11:34,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 656/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7114774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:34,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66075 samples/s/p 0:58:09 } +2024-07-30 05:11:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 658/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.7088759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65994 samples/s/p 0:58:06 } +2024-07-30 05:11:40,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 660/ 3125], loss: 0.120, per_step_time: 1412ms, lr: 1.706275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:40,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66194 samples/s/p 0:58:02 } +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 662/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7036765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:42,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.66024 samples/s/p 0:58:01 } +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 664/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.7010799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:45,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.65900 samples/s/p 0:57:59 } +2024-07-30 05:11:48,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 666/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6984844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:48,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65870 samples/s/p 0:57:56 } +2024-07-30 05:11:51,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 668/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.695891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:51,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65896 samples/s/p 0:57:53 } +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 670/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 1.6932988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:54,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65729 samples/s/p 0:57:51 } +2024-07-30 05:11:57,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 672/ 3125], loss: 0.271, per_step_time: 1415ms, lr: 1.690708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:57,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.65014 samples/s/p 0:57:53 } +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 674/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 1.6881182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:11:59,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66039 samples/s/p 0:57:44 } +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 676/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 1.6855311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:02,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65779 samples/s/p 0:57:42 } +2024-07-30 05:12:05,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 678/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6829442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66118 samples/s/p 0:57:37 } +2024-07-30 05:12:08,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 680/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.6803601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:08,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.66035 samples/s/p 0:57:35 } +2024-07-30 05:12:11,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 682/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.6777774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:11,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.65771 samples/s/p 0:57:34 } +2024-07-30 05:12:14,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 684/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 1.6751966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:14,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66085 samples/s/p 0:57:29 } +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 686/ 3125], loss: 0.592, per_step_time: 1413ms, lr: 1.6726168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.66127 samples/s/p 0:57:26 } +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 688/ 3125], loss: 0.160, per_step_time: 1413ms, lr: 1.670038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:19,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.66061 samples/s/p 0:57:24 } +2024-07-30 05:12:22,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 690/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.6674619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:22,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.65647 samples/s/p 0:57:23 } +2024-07-30 05:12:25,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 692/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.6648873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:25,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.66101 samples/s/p 0:57:18 } +2024-07-30 05:12:28,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 694/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 1.6623145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:28,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66142 samples/s/p 0:57:15 } +2024-07-30 05:12:31,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 696/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6597429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66158 samples/s/p 0:57:12 } +2024-07-30 05:12:33,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 698/ 3125], loss: 0.281, per_step_time: 1413ms, lr: 1.657173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.66147 samples/s/p 0:57:09 } +2024-07-30 05:12:36,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 700/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.6546037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:36,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.65995 samples/s/p 0:57:07 } +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 702/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.6520369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:39,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65865 samples/s/p 0:57:05 } +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 704/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.6494708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:42,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65891 samples/s/p 0:57:02 } +2024-07-30 05:12:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 706/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 1.6469075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65845 samples/s/p 0:57:00 } +2024-07-30 05:12:48,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 708/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.6443457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:48,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65748 samples/s/p 0:56:57 } +2024-07-30 05:12:50,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 1.6417855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:50,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.65924 samples/s/p 0:56:53 } +2024-07-30 05:12:53,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 712/ 3125], loss: 0.073, per_step_time: 1414ms, lr: 1.6392266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:53,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65756 samples/s/p 0:56:52 } +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 714/ 3125], loss: 0.369, per_step_time: 1413ms, lr: 1.6366696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:56,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66171 samples/s/p 0:56:46 } +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 716/ 3125], loss: 0.282, per_step_time: 1414ms, lr: 1.6341144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:12:59,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.65735 samples/s/p 0:56:46 } +2024-07-30 05:13:02,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 718/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 1.6315594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:02,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66110 samples/s/p 0:56:41 } +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 720/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.6290071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:05,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.66013 samples/s/p 0:56:39 } +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 722/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 1.6264567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:07,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.66010 samples/s/p 0:56:36 } +2024-07-30 05:13:10,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 724/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 1.6239064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:10,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65898 samples/s/p 0:56:34 } +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 726/ 3125], loss: 0.217, per_step_time: 1414ms, lr: 1.6213589e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:13,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65717 samples/s/p 0:56:32 } +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 728/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 1.6188135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:16,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.65754 samples/s/p 0:56:29 } +2024-07-30 05:13:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 730/ 3125], loss: 0.191, per_step_time: 1412ms, lr: 1.6162691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.66240 samples/s/p 0:56:23 } +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 732/ 3125], loss: 0.114, per_step_time: 1413ms, lr: 1.6137257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65979 samples/s/p 0:56:22 } +2024-07-30 05:13:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 734/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6111848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65811 samples/s/p 0:56:20 } +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 736/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.6086453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:27,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65891 samples/s/p 0:56:17 } +2024-07-30 05:13:30,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 738/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.6061076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:30,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.65696 samples/s/p 0:56:15 } +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 740/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 1.6035715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65811 samples/s/p 0:56:12 } +2024-07-30 05:13:36,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 742/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.6010371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66033 samples/s/p 0:56:08 } +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 744/ 3125], loss: 0.424, per_step_time: 1413ms, lr: 1.5985032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:39,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66066 samples/s/p 0:56:04 } +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 746/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 1.5959721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:42,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.66084 samples/s/p 0:56:02 } +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 748/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 1.5934413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.65972 samples/s/p 0:55:59 } +2024-07-30 05:13:47,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 750/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.5909135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.66004 samples/s/p 0:55:56 } +2024-07-30 05:13:47,669 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:14:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 752/ 3125], loss: 0.167, per_step_time: 3017ms, lr: 1.5883871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:24,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 2.65153 samples/s/p 1:59:19 } +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 754/ 3125], loss: 0.306, per_step_time: 1414ms, lr: 1.5858626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:26,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65500 samples/s/p 0:55:54 } +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 756/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.5833392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:29,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.65959 samples/s/p 0:55:48 } +2024-07-30 05:14:32,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 758/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.5808176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65588 samples/s/p 0:55:48 } +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 760/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 1.5782979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:35,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65107 samples/s/p 0:55:48 } +2024-07-30 05:14:38,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 762/ 3125], loss: 0.289, per_step_time: 1414ms, lr: 1.5757787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:38,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.65434 samples/s/p 0:55:43 } +2024-07-30 05:14:41,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 764/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.5732625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:41,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66119 samples/s/p 0:55:36 } +2024-07-30 05:14:44,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 766/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.5707475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:44,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.66157 samples/s/p 0:55:33 } +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 768/ 3125], loss: 0.225, per_step_time: 1416ms, lr: 1.5682333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:47,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.64652 samples/s/p 0:55:39 } +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 770/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.5657216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:50,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66130 samples/s/p 0:55:27 } +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 772/ 3125], loss: 0.538, per_step_time: 1414ms, lr: 1.5632113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:53,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.65714 samples/s/p 0:55:27 } +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 774/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.5607031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:55,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66000 samples/s/p 0:55:22 } +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 776/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.5581957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:14:58,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.66172 samples/s/p 0:55:19 } +2024-07-30 05:15:01,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 778/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.5556905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:01,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65966 samples/s/p 0:55:17 } +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 780/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.5531871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.65882 samples/s/p 0:55:15 } +2024-07-30 05:15:07,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 782/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.5506852e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:07,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66029 samples/s/p 0:55:11 } +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 784/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.548185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:10,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.66159 samples/s/p 0:55:07 } +2024-07-30 05:15:13,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 786/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 1.5456867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:13,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65976 samples/s/p 0:55:06 } +2024-07-30 05:15:16,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 788/ 3125], loss: 0.313, per_step_time: 1414ms, lr: 1.543189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:16,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65576 samples/s/p 0:55:05 } +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 790/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 1.5406936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:19,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65486 samples/s/p 0:55:03 } +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 792/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 1.5381992e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:22,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.65757 samples/s/p 0:54:58 } +2024-07-30 05:15:24,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 794/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.5357074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.66072 samples/s/p 0:54:54 } +2024-07-30 05:15:27,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 796/ 3125], loss: 0.059, per_step_time: 1414ms, lr: 1.5332171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:27,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65403 samples/s/p 0:54:55 } +2024-07-30 05:15:30,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 798/ 3125], loss: 0.459, per_step_time: 1415ms, lr: 1.5307284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:30,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65346 samples/s/p 0:54:52 } +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 800/ 3125], loss: 0.366, per_step_time: 1413ms, lr: 1.5282416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:33,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65782 samples/s/p 0:54:47 } +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 802/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 1.525756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:36,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.65856 samples/s/p 0:54:44 } +2024-07-30 05:15:39,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 804/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 1.5232717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:39,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.66030 samples/s/p 0:54:40 } +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 806/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 1.5207895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66043 samples/s/p 0:54:37 } +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 808/ 3125], loss: 0.235, per_step_time: 1414ms, lr: 1.5183094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:44,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65615 samples/s/p 0:54:37 } +2024-07-30 05:15:47,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 810/ 3125], loss: 0.235, per_step_time: 1413ms, lr: 1.5158307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:47,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65937 samples/s/p 0:54:32 } +2024-07-30 05:15:50,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 812/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.5133529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:50,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.66091 samples/s/p 0:54:28 } +2024-07-30 05:15:53,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 814/ 3125], loss: 0.359, per_step_time: 1414ms, lr: 1.5108776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.65765 samples/s/p 0:54:27 } +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 816/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 1.508404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65889 samples/s/p 0:54:24 } +2024-07-30 05:15:59,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 818/ 3125], loss: 0.181, per_step_time: 1418ms, lr: 1.5059313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:15:59,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.63879 samples/s/p 0:54:33 } +2024-07-30 05:16:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 820/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.5034607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:01,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.66064 samples/s/p 0:54:17 } +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 822/ 3125], loss: 0.343, per_step_time: 1415ms, lr: 1.5009921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:04,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.65090 samples/s/p 0:54:20 } +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 824/ 3125], loss: 0.420, per_step_time: 1413ms, lr: 1.4985251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:07,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.66125 samples/s/p 0:54:11 } +2024-07-30 05:16:10,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 826/ 3125], loss: 0.120, per_step_time: 1415ms, lr: 1.4960599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:10,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65316 samples/s/p 0:54:13 } +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 828/ 3125], loss: 0.141, per_step_time: 1415ms, lr: 1.4935964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:13,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.64994 samples/s/p 0:54:12 } +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 830/ 3125], loss: 0.413, per_step_time: 1414ms, lr: 1.4911344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:16,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65529 samples/s/p 0:54:06 } +2024-07-30 05:16:18,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 832/ 3125], loss: 0.234, per_step_time: 1415ms, lr: 1.4886731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:18,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.65370 samples/s/p 0:54:04 } +2024-07-30 05:16:21,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 834/ 3125], loss: 0.438, per_step_time: 1412ms, lr: 1.4862144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:21,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66331 samples/s/p 0:53:56 } +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 836/ 3125], loss: 0.238, per_step_time: 1412ms, lr: 1.4837568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66243 samples/s/p 0:53:53 } +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 838/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.4813014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:27,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66081 samples/s/p 0:53:52 } +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 840/ 3125], loss: 0.145, per_step_time: 1413ms, lr: 1.4788482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:30,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.65815 samples/s/p 0:53:50 } +2024-07-30 05:16:33,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 842/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 1.4763963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.66073 samples/s/p 0:53:46 } +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 844/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.473946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:35,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.65859 samples/s/p 0:53:44 } +2024-07-30 05:16:38,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 846/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.4714974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:38,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66057 samples/s/p 0:53:40 } +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 848/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 1.4690497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:41,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66090 samples/s/p 0:53:37 } +2024-07-30 05:16:44,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 850/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 1.4666044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:44,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.66044 samples/s/p 0:53:35 } +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 852/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4641612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:47,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66054 samples/s/p 0:53:32 } +2024-07-30 05:16:50,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 854/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.4617192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:50,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.65909 samples/s/p 0:53:30 } +2024-07-30 05:16:52,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 856/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.4592785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:52,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66133 samples/s/p 0:53:26 } +2024-07-30 05:16:55,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 858/ 3125], loss: 0.118, per_step_time: 1412ms, lr: 1.45684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:55,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66248 samples/s/p 0:53:22 } +2024-07-30 05:16:58,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 860/ 3125], loss: 0.421, per_step_time: 1413ms, lr: 1.4544033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:16:58,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.66014 samples/s/p 0:53:21 } +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 862/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 1.4519674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:01,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65811 samples/s/p 0:53:19 } +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 864/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.4495342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:04,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.66024 samples/s/p 0:53:15 } +2024-07-30 05:17:07,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 866/ 3125], loss: 0.387, per_step_time: 1415ms, lr: 1.4471024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:07,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65228 samples/s/p 0:53:17 } +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 868/ 3125], loss: 0.226, per_step_time: 1413ms, lr: 1.4446726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:09,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.65804 samples/s/p 0:53:11 } +2024-07-30 05:17:12,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 870/ 3125], loss: 0.101, per_step_time: 1416ms, lr: 1.4422443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.64796 samples/s/p 0:53:14 } +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 872/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 1.4398178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:15,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66027 samples/s/p 0:53:04 } +2024-07-30 05:17:18,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 874/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4373928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:18,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.66094 samples/s/p 0:53:01 } +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 876/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 1.434969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:21,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.66055 samples/s/p 0:52:58 } +2024-07-30 05:17:24,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 878/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 1.4325475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:24,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.65987 samples/s/p 0:52:56 } +2024-07-30 05:17:26,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 880/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.430127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:26,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66138 samples/s/p 0:52:52 } +2024-07-30 05:17:29,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 882/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4277089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:29,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65952 samples/s/p 0:52:50 } +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 884/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 1.4252928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:32,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65940 samples/s/p 0:52:47 } +2024-07-30 05:17:35,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 886/ 3125], loss: 0.484, per_step_time: 1413ms, lr: 1.4228782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:35,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.66058 samples/s/p 0:52:44 } +2024-07-30 05:17:38,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 888/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.4204651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:38,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.65524 samples/s/p 0:52:44 } +2024-07-30 05:17:41,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 890/ 3125], loss: 0.181, per_step_time: 1412ms, lr: 1.4180529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:41,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66272 samples/s/p 0:52:37 } +2024-07-30 05:17:43,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 892/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 1.4156436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:43,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65540 samples/s/p 0:52:38 } +2024-07-30 05:17:46,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 894/ 3125], loss: 0.214, per_step_time: 1413ms, lr: 1.413236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:46,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65821 samples/s/p 0:52:34 } +2024-07-30 05:17:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 896/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.41083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:49,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.65946 samples/s/p 0:52:30 } +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 898/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 1.4084255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:52,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.66061 samples/s/p 0:52:27 } +2024-07-30 05:17:55,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 900/ 3125], loss: 0.492, per_step_time: 1415ms, lr: 1.406022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:55,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65333 samples/s/p 0:52:28 } +2024-07-30 05:17:58,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 902/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.4036211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:17:58,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.66110 samples/s/p 0:52:21 } +2024-07-30 05:18:00,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 904/ 3125], loss: 0.187, per_step_time: 1415ms, lr: 1.401222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:00,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65112 samples/s/p 0:52:24 } +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 906/ 3125], loss: 0.287, per_step_time: 1414ms, lr: 1.3988235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:03,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.65466 samples/s/p 0:52:19 } +2024-07-30 05:18:06,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 908/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 1.396428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:06,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65665 samples/s/p 0:52:15 } +2024-07-30 05:18:09,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 910/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 1.3940337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:09,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65726 samples/s/p 0:52:12 } +2024-07-30 05:18:12,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 912/ 3125], loss: 0.139, per_step_time: 1414ms, lr: 1.3916415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:12,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65686 samples/s/p 0:52:09 } +2024-07-30 05:18:15,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 914/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.389251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:15,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65996 samples/s/p 0:52:05 } +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 916/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.3868621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:17,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.65973 samples/s/p 0:52:02 } +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 918/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.3844749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:20,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65990 samples/s/p 0:51:59 } +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 920/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 1.3820886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:23,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66051 samples/s/p 0:51:56 } +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 922/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 1.379705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:26,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.65942 samples/s/p 0:51:54 } +2024-07-30 05:18:29,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 924/ 3125], loss: 0.369, per_step_time: 1412ms, lr: 1.3773221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:29,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66175 samples/s/p 0:51:49 } +2024-07-30 05:18:32,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 926/ 3125], loss: 0.270, per_step_time: 1412ms, lr: 1.374942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:32,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.66232 samples/s/p 0:51:46 } +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 928/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.3725635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:34,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65942 samples/s/p 0:51:45 } +2024-07-30 05:18:37,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 930/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 1.3701865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.66106 samples/s/p 0:51:41 } +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 932/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 1.3678115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:40,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65854 samples/s/p 0:51:40 } +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 934/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 1.3654375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:43,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.65793 samples/s/p 0:51:37 } +2024-07-30 05:18:46,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 936/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.3630661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:46,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65853 samples/s/p 0:51:34 } +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 938/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.3606963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:49,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65672 samples/s/p 0:51:32 } +2024-07-30 05:18:51,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 940/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.3583282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:51,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65832 samples/s/p 0:51:29 } +2024-07-30 05:18:54,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 942/ 3125], loss: 0.351, per_step_time: 1413ms, lr: 1.3559616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:54,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.66034 samples/s/p 0:51:25 } +2024-07-30 05:18:57,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 944/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.3535961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:18:57,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.65789 samples/s/p 0:51:23 } +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 946/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 1.3512334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:00,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66087 samples/s/p 0:51:19 } +2024-07-30 05:19:03,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 948/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 1.3488716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:03,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.66149 samples/s/p 0:51:16 } +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 950/ 3125], loss: 0.323, per_step_time: 1416ms, lr: 1.3465121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:06,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.64592 samples/s/p 0:51:21 } +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 952/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 1.3441542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:08,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65936 samples/s/p 0:51:11 } +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 954/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 1.3417986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.65988 samples/s/p 0:51:08 } +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 956/ 3125], loss: 0.491, per_step_time: 1413ms, lr: 1.3394442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:14,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65890 samples/s/p 0:51:06 } +2024-07-30 05:19:17,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 958/ 3125], loss: 0.460, per_step_time: 1413ms, lr: 1.3370919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:17,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65881 samples/s/p 0:51:03 } +2024-07-30 05:19:20,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 960/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 1.3347413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:20,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65860 samples/s/p 0:51:00 } +2024-07-30 05:19:23,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 962/ 3125], loss: 0.367, per_step_time: 1413ms, lr: 1.3323923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:23,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65928 samples/s/p 0:50:57 } +2024-07-30 05:19:25,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 964/ 3125], loss: 0.162, per_step_time: 1414ms, lr: 1.3300445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:25,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.65547 samples/s/p 0:50:56 } +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 966/ 3125], loss: 0.299, per_step_time: 1412ms, lr: 1.3276988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:28,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.66196 samples/s/p 0:50:50 } +2024-07-30 05:19:31,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 968/ 3125], loss: 0.222, per_step_time: 1414ms, lr: 1.3253546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:31,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65650 samples/s/p 0:50:50 } +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 970/ 3125], loss: 0.281, per_step_time: 1412ms, lr: 1.3230127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:34,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.66186 samples/s/p 0:50:44 } +2024-07-30 05:19:37,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 972/ 3125], loss: 0.278, per_step_time: 1414ms, lr: 1.3206726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.65716 samples/s/p 0:50:44 } +2024-07-30 05:19:40,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 974/ 3125], loss: 0.165, per_step_time: 1415ms, lr: 1.3183341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:40,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65263 samples/s/p 0:50:44 } +2024-07-30 05:19:42,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 976/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.3159975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:42,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.66111 samples/s/p 0:50:36 } +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 978/ 3125], loss: 0.212, per_step_time: 1415ms, lr: 1.3136619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:45,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65204 samples/s/p 0:50:38 } +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 980/ 3125], loss: 0.332, per_step_time: 1416ms, lr: 1.3113287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:48,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.64595 samples/s/p 0:50:39 } +2024-07-30 05:19:51,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 982/ 3125], loss: 0.478, per_step_time: 1414ms, lr: 1.3089972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:51,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.65466 samples/s/p 0:50:31 } +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 984/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 1.3066679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:54,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66157 samples/s/p 0:50:25 } +2024-07-30 05:19:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 986/ 3125], loss: 0.351, per_step_time: 1414ms, lr: 1.30434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65688 samples/s/p 0:50:24 } +2024-07-30 05:19:59,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 988/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 1.302014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:19:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65926 samples/s/p 0:50:20 } +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 990/ 3125], loss: 0.295, per_step_time: 1412ms, lr: 1.2996887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:02,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.66234 samples/s/p 0:50:16 } +2024-07-30 05:20:05,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 992/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.2973654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:05,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.65932 samples/s/p 0:50:15 } +2024-07-30 05:20:08,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 994/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 1.2950447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:08,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65924 samples/s/p 0:50:12 } +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 996/ 3125], loss: 0.069, per_step_time: 1413ms, lr: 1.2927258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:11,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66040 samples/s/p 0:50:08 } +2024-07-30 05:20:14,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 998/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 1.2904086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.65997 samples/s/p 0:50:06 } +2024-07-30 05:20:16,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1000/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.288093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:16,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.66120 samples/s/p 0:50:02 } +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1002/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 1.2857795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:19,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66047 samples/s/p 0:50:00 } +2024-07-30 05:20:22,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1004/ 3125], loss: 0.308, per_step_time: 1412ms, lr: 1.2834673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:22,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66247 samples/s/p 0:49:56 } +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1006/ 3125], loss: 0.276, per_step_time: 1415ms, lr: 1.2811565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:25,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65056 samples/s/p 0:50:00 } +2024-07-30 05:20:28,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1008/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 1.2788483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:28,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.65984 samples/s/p 0:49:52 } +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1010/ 3125], loss: 0.185, per_step_time: 1413ms, lr: 1.2765416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:31,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.66115 samples/s/p 0:49:48 } +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1012/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 1.2742358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:33,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65873 samples/s/p 0:49:47 } +2024-07-30 05:20:36,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1014/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 1.271933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:36,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65629 samples/s/p 0:49:45 } +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1016/ 3125], loss: 0.141, per_step_time: 1414ms, lr: 1.2696316e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:39,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65756 samples/s/p 0:49:42 } +2024-07-30 05:20:42,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1018/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.2673321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:42,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65923 samples/s/p 0:49:38 } +2024-07-30 05:20:45,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1020/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 1.2650338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:45,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.65662 samples/s/p 0:49:37 } +2024-07-30 05:20:48,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1022/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 1.2627381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:48,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65821 samples/s/p 0:49:33 } +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1024/ 3125], loss: 0.189, per_step_time: 1414ms, lr: 1.2604439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:51,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65565 samples/s/p 0:49:31 } +2024-07-30 05:20:53,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1026/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.2581515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:53,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.66108 samples/s/p 0:49:26 } +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1028/ 3125], loss: 0.138, per_step_time: 1415ms, lr: 1.2558612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:56,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.65218 samples/s/p 0:49:28 } +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1030/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2535721e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:20:59,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66125 samples/s/p 0:49:20 } +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1032/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 1.2512851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65525 samples/s/p 0:49:20 } +2024-07-30 05:21:05,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1034/ 3125], loss: 0.368, per_step_time: 1413ms, lr: 1.2489995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:05,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66080 samples/s/p 0:49:15 } +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1036/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.2467151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.65976 samples/s/p 0:49:12 } +2024-07-30 05:21:10,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1038/ 3125], loss: 0.411, per_step_time: 1413ms, lr: 1.2444335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:10,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.66087 samples/s/p 0:49:09 } +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1040/ 3125], loss: 0.436, per_step_time: 1412ms, lr: 1.2421536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:13,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66191 samples/s/p 0:49:06 } +2024-07-30 05:21:16,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1042/ 3125], loss: 0.456, per_step_time: 1413ms, lr: 1.2398758e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:16,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65868 samples/s/p 0:49:04 } +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1044/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 1.2375996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:19,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65889 samples/s/p 0:49:01 } +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1046/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.2353253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:22,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.66112 samples/s/p 0:48:57 } +2024-07-30 05:21:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1048/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.2330526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.65846 samples/s/p 0:48:56 } +2024-07-30 05:21:27,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1050/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.2307808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:27,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66157 samples/s/p 0:48:52 } +2024-07-30 05:21:30,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1052/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 1.2285119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:30,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65922 samples/s/p 0:48:50 } +2024-07-30 05:21:33,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1054/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.2262445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:33,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.66033 samples/s/p 0:48:47 } +2024-07-30 05:21:36,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1056/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.2239792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:36,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.65860 samples/s/p 0:48:45 } +2024-07-30 05:21:39,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1058/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 1.2217149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:39,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65911 samples/s/p 0:48:42 } +2024-07-30 05:21:42,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1060/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 1.2194532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.66102 samples/s/p 0:48:38 } +2024-07-30 05:21:44,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1062/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.2171932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:44,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.65986 samples/s/p 0:48:35 } +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1064/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.214934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:47,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.65995 samples/s/p 0:48:33 } +2024-07-30 05:21:50,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1066/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 1.2126776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:50,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.66002 samples/s/p 0:48:30 } +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1068/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 1.2104231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65883 samples/s/p 0:48:28 } +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1070/ 3125], loss: 0.186, per_step_time: 1413ms, lr: 1.2081704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:56,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65969 samples/s/p 0:48:24 } +2024-07-30 05:21:59,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1072/ 3125], loss: 0.303, per_step_time: 1414ms, lr: 1.2059196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:21:59,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65643 samples/s/p 0:48:23 } +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1074/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.2036704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:01,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.65431 samples/s/p 0:48:21 } +2024-07-30 05:22:04,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1076/ 3125], loss: 0.046, per_step_time: 1413ms, lr: 1.2014228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:04,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.66149 samples/s/p 0:48:15 } +2024-07-30 05:22:07,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1078/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 1.1991766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:07,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.66018 samples/s/p 0:48:13 } +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1080/ 3125], loss: 0.406, per_step_time: 1415ms, lr: 1.1969328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:10,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65263 samples/s/p 0:48:14 } +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1082/ 3125], loss: 0.318, per_step_time: 1414ms, lr: 1.1946902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:13,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.65710 samples/s/p 0:48:09 } +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1084/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.1924502e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:16,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.66122 samples/s/p 0:48:04 } +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1086/ 3125], loss: 0.321, per_step_time: 1412ms, lr: 1.1902121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:18,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66209 samples/s/p 0:48:00 } +2024-07-30 05:22:21,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1088/ 3125], loss: 0.171, per_step_time: 1415ms, lr: 1.1879754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:21,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65252 samples/s/p 0:48:02 } +2024-07-30 05:22:24,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1090/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 1.1857411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:24,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65819 samples/s/p 0:47:57 } +2024-07-30 05:22:27,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1092/ 3125], loss: 0.198, per_step_time: 1414ms, lr: 1.1835074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:27,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.65553 samples/s/p 0:47:55 } +2024-07-30 05:22:30,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1094/ 3125], loss: 0.198, per_step_time: 1412ms, lr: 1.1812764e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.66185 samples/s/p 0:47:49 } +2024-07-30 05:22:33,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 1.1790472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66121 samples/s/p 0:47:47 } +2024-07-30 05:22:35,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1098/ 3125], loss: 0.470, per_step_time: 1413ms, lr: 1.1768198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:35,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65842 samples/s/p 0:47:45 } +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1100/ 3125], loss: 0.447, per_step_time: 1414ms, lr: 1.1745944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:38,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.65516 samples/s/p 0:47:44 } +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1102/ 3125], loss: 0.428, per_step_time: 1413ms, lr: 1.1723699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:41,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66120 samples/s/p 0:47:38 } +2024-07-30 05:22:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1104/ 3125], loss: 0.231, per_step_time: 1412ms, lr: 1.1701483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:44,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.66231 samples/s/p 0:47:35 } +2024-07-30 05:22:47,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1106/ 3125], loss: 0.515, per_step_time: 1413ms, lr: 1.167928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:47,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65946 samples/s/p 0:47:33 } +2024-07-30 05:22:50,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1108/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.1657089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:50,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65902 samples/s/p 0:47:31 } +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1110/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 1.1634928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:52,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65881 samples/s/p 0:47:28 } +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1112/ 3125], loss: 0.417, per_step_time: 1415ms, lr: 1.1612782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:55,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65196 samples/s/p 0:47:29 } +2024-07-30 05:22:58,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1114/ 3125], loss: 0.305, per_step_time: 1414ms, lr: 1.1590654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:22:58,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.65383 samples/s/p 0:47:25 } +2024-07-30 05:23:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1116/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.1568549e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65802 samples/s/p 0:47:20 } +2024-07-30 05:23:04,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1118/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 1.1546457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:04,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65965 samples/s/p 0:47:16 } +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1120/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1524385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:07,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.65823 samples/s/p 0:47:14 } +2024-07-30 05:23:09,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1122/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 1.1502325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:09,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.66068 samples/s/p 0:47:10 } +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1124/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 1.1480287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.65958 samples/s/p 0:47:08 } +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1126/ 3125], loss: 0.200, per_step_time: 1412ms, lr: 1.1458262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:15,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66193 samples/s/p 0:47:04 } +2024-07-30 05:23:18,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1128/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 1.1436265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:18,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66004 samples/s/p 0:47:02 } +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1130/ 3125], loss: 0.113, per_step_time: 1412ms, lr: 1.1414284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:21,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.66235 samples/s/p 0:46:58 } +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1132/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 1.1392325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:24,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.65964 samples/s/p 0:46:57 } +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1134/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 1.1370381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65943 samples/s/p 0:46:54 } +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1136/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.1348446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:29,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66172 samples/s/p 0:46:50 } +2024-07-30 05:23:32,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1138/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 1.1326542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:32,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.65818 samples/s/p 0:46:49 } +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1140/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.1304655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:35,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66064 samples/s/p 0:46:45 } +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1142/ 3125], loss: 0.176, per_step_time: 1412ms, lr: 1.1282783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:38,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.66196 samples/s/p 0:46:41 } +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1144/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 1.1260936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:41,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65642 samples/s/p 0:46:41 } +2024-07-30 05:23:43,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.1239093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:43,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65939 samples/s/p 0:46:37 } +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1148/ 3125], loss: 0.259, per_step_time: 1414ms, lr: 1.1217281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65682 samples/s/p 0:46:35 } +2024-07-30 05:23:49,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1150/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 1.1195477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.65883 samples/s/p 0:46:32 } +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1152/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.1173704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:52,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66016 samples/s/p 0:46:28 } +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1154/ 3125], loss: 0.331, per_step_time: 1412ms, lr: 1.1151942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:55,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66172 samples/s/p 0:46:25 } +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1156/ 3125], loss: 0.473, per_step_time: 1413ms, lr: 1.1130204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:23:58,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.66093 samples/s/p 0:46:22 } +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1158/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 1.1108484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:00,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.65772 samples/s/p 0:46:21 } +2024-07-30 05:24:03,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1160/ 3125], loss: 0.223, per_step_time: 1416ms, lr: 1.1086782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:03,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.64580 samples/s/p 0:46:24 } +2024-07-30 05:24:06,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1162/ 3125], loss: 0.360, per_step_time: 1414ms, lr: 1.1065096e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:06,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65639 samples/s/p 0:46:16 } +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1164/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 1.1043423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:09,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65944 samples/s/p 0:46:12 } +2024-07-30 05:24:12,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1166/ 3125], loss: 0.140, per_step_time: 1413ms, lr: 1.1021775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:12,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.65908 samples/s/p 0:46:09 } +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1168/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.1000147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:15,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66106 samples/s/p 0:46:05 } +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1170/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.0978531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:17,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.66097 samples/s/p 0:46:02 } +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1172/ 3125], loss: 0.636, per_step_time: 1413ms, lr: 1.0956943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:20,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65779 samples/s/p 0:46:01 } +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1174/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 1.0935369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.65862 samples/s/p 0:45:58 } +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1176/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 1.0913816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:26,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.66035 samples/s/p 0:45:54 } +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1178/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 1.0892278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:29,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.66067 samples/s/p 0:45:51 } +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1180/ 3125], loss: 0.293, per_step_time: 1417ms, lr: 1.0870757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:32,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.64552 samples/s/p 0:45:56 } +2024-07-30 05:24:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1182/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 1.0849258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65996 samples/s/p 0:45:46 } +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1184/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.082778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65882 samples/s/p 0:45:44 } +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1186/ 3125], loss: 0.209, per_step_time: 1415ms, lr: 1.0806319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:40,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65287 samples/s/p 0:45:44 } +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1188/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 1.0784879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:43,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.65807 samples/s/p 0:45:38 } +2024-07-30 05:24:46,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1190/ 3125], loss: 0.440, per_step_time: 1412ms, lr: 1.0763446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:46,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66177 samples/s/p 0:45:34 } +2024-07-30 05:24:49,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1192/ 3125], loss: 0.310, per_step_time: 1413ms, lr: 1.0742044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:49,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65993 samples/s/p 0:45:32 } +2024-07-30 05:24:51,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1194/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 1.0720652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:51,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.66125 samples/s/p 0:45:28 } +2024-07-30 05:24:54,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1196/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 1.0699284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:54,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65926 samples/s/p 0:45:26 } +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1198/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 1.0677936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:24:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.65758 samples/s/p 0:45:24 } +2024-07-30 05:25:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1200/ 3125], loss: 0.418, per_step_time: 1414ms, lr: 1.0656607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65662 samples/s/p 0:45:22 } +2024-07-30 05:25:03,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1202/ 3125], loss: 0.381, per_step_time: 1416ms, lr: 1.0635296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:03,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.64877 samples/s/p 0:45:23 } +2024-07-30 05:25:06,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1204/ 3125], loss: 0.090, per_step_time: 1413ms, lr: 1.0614004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:06,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65997 samples/s/p 0:45:15 } +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1206/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 1.0592731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:08,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.65376 samples/s/p 0:45:15 } +2024-07-30 05:25:11,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1208/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.0571473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66044 samples/s/p 0:45:09 } +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1210/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 1.055024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:14,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66276 samples/s/p 0:45:05 } +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1212/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 1.0529023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.65983 samples/s/p 0:45:03 } +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1214/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 1.0507816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:20,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66088 samples/s/p 0:45:00 } +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1216/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.0486639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:23,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.66127 samples/s/p 0:44:57 } +2024-07-30 05:25:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1218/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 1.0465478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:25,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66016 samples/s/p 0:44:55 } +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1220/ 3125], loss: 0.091, per_step_time: 1413ms, lr: 1.0444339e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:28,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66118 samples/s/p 0:44:52 } +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1222/ 3125], loss: 0.350, per_step_time: 1413ms, lr: 1.0423207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:31,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.65919 samples/s/p 0:44:50 } +2024-07-30 05:25:34,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1224/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 1.0402107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66051 samples/s/p 0:44:46 } +2024-07-30 05:25:37,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1226/ 3125], loss: 0.082, per_step_time: 1412ms, lr: 1.0381021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:37,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.66176 samples/s/p 0:44:43 } +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1228/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 1.0359954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:40,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66056 samples/s/p 0:44:41 } +2024-07-30 05:25:42,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1230/ 3125], loss: 0.169, per_step_time: 1412ms, lr: 1.0338911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:42,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.66289 samples/s/p 0:44:37 } +2024-07-30 05:25:45,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1232/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 1.0317883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:45,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65865 samples/s/p 0:44:36 } +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1234/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 1.0296869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:48,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.65964 samples/s/p 0:44:32 } +2024-07-30 05:25:51,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1236/ 3125], loss: 0.283, per_step_time: 1414ms, lr: 1.0275876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:51,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.65482 samples/s/p 0:44:32 } +2024-07-30 05:25:54,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1238/ 3125], loss: 0.423, per_step_time: 1412ms, lr: 1.0254902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:54,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66300 samples/s/p 0:44:25 } +2024-07-30 05:25:57,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1240/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 1.023395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:57,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66069 samples/s/p 0:44:23 } +2024-07-30 05:25:59,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1242/ 3125], loss: 0.130, per_step_time: 1412ms, lr: 1.0213017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:25:59,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.66207 samples/s/p 0:44:20 } +2024-07-30 05:26:02,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1244/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 1.0192105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.65896 samples/s/p 0:44:19 } +2024-07-30 05:26:05,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1246/ 3125], loss: 0.129, per_step_time: 1414ms, lr: 1.0171208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:05,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65519 samples/s/p 0:44:18 } +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1248/ 3125], loss: 0.165, per_step_time: 1415ms, lr: 1.0150334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:08,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.65345 samples/s/p 0:44:16 } +2024-07-30 05:26:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1250/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.0129478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.66024 samples/s/p 0:44:10 } +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1252/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.0108635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:14,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65614 samples/s/p 0:44:09 } +2024-07-30 05:26:16,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1254/ 3125], loss: 0.194, per_step_time: 1415ms, lr: 1.0087817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:16,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.65222 samples/s/p 0:44:08 } +2024-07-30 05:26:19,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1256/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 1.0067016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:19,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65726 samples/s/p 0:44:02 } +2024-07-30 05:26:22,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1258/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 1.0046228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:22,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65783 samples/s/p 0:43:59 } +2024-07-30 05:26:25,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1260/ 3125], loss: 0.385, per_step_time: 1413ms, lr: 1.0025468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:25,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65956 samples/s/p 0:43:56 } +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1262/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.0004726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.66007 samples/s/p 0:43:53 } +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1264/ 3125], loss: 0.344, per_step_time: 1414ms, lr: 9.984001e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:31,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.65404 samples/s/p 0:43:53 } +2024-07-30 05:26:33,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1266/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 9.963288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:33,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66006 samples/s/p 0:43:47 } +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1268/ 3125], loss: 0.256, per_step_time: 1412ms, lr: 9.942609e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66242 samples/s/p 0:43:43 } +2024-07-30 05:26:39,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1270/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 9.921941e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:39,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.66050 samples/s/p 0:43:41 } +2024-07-30 05:26:42,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1272/ 3125], loss: 0.419, per_step_time: 1419ms, lr: 9.901294e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:42,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.63524 samples/s/p 0:43:50 } +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1274/ 3125], loss: 0.539, per_step_time: 1413ms, lr: 9.880667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:45,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66059 samples/s/p 0:43:35 } +2024-07-30 05:26:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1276/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 9.86006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66016 samples/s/p 0:43:33 } +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1278/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 9.839463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:50,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66059 samples/s/p 0:43:30 } +2024-07-30 05:26:53,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1280/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 9.818893e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.66073 samples/s/p 0:43:27 } +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1282/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 9.798335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:56,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.65826 samples/s/p 0:43:25 } +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1284/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 9.777805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:26:59,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65996 samples/s/p 0:43:22 } +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1286/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.757292e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:02,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66122 samples/s/p 0:43:18 } +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1288/ 3125], loss: 0.435, per_step_time: 1413ms, lr: 9.7368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:05,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66004 samples/s/p 0:43:16 } +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1290/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 9.716326e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:08,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.66118 samples/s/p 0:43:13 } +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1292/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.695873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:10,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.65971 samples/s/p 0:43:10 } +2024-07-30 05:27:13,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1294/ 3125], loss: 0.251, per_step_time: 1413ms, lr: 9.675427e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:13,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66063 samples/s/p 0:43:07 } +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1296/ 3125], loss: 0.406, per_step_time: 1412ms, lr: 9.655014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:16,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66222 samples/s/p 0:43:04 } +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1298/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 9.634616e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:19,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.65929 samples/s/p 0:43:02 } +2024-07-30 05:27:22,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1300/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 9.614238e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:22,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.66276 samples/s/p 0:42:58 } +2024-07-30 05:27:25,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1302/ 3125], loss: 0.200, per_step_time: 1415ms, lr: 9.593874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:25,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65345 samples/s/p 0:42:59 } +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1304/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 9.573533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:27,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.66143 samples/s/p 0:42:53 } +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1306/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 9.553214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:30,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65795 samples/s/p 0:42:51 } +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1308/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 9.532913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65439 samples/s/p 0:42:50 } +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1310/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 9.512627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:36,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.65898 samples/s/p 0:42:45 } +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1312/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 9.4923644e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:39,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66133 samples/s/p 0:42:41 } +2024-07-30 05:27:42,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1314/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 9.4721196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:42,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66092 samples/s/p 0:42:39 } +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1316/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 9.4518987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:44,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.65975 samples/s/p 0:42:37 } +2024-07-30 05:27:47,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1318/ 3125], loss: 0.449, per_step_time: 1413ms, lr: 9.4316925e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:47,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66118 samples/s/p 0:42:33 } +2024-07-30 05:27:50,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1320/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 9.4115137e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:50,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.66148 samples/s/p 0:42:30 } +2024-07-30 05:27:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1322/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.391346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:53,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65936 samples/s/p 0:42:28 } +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1324/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 9.371191e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:56,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66047 samples/s/p 0:42:25 } +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1326/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 9.3510596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:27:59,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.66032 samples/s/p 0:42:22 } +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1328/ 3125], loss: 0.412, per_step_time: 1413ms, lr: 9.330952e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:01,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.65982 samples/s/p 0:42:20 } +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1330/ 3125], loss: 0.522, per_step_time: 1414ms, lr: 9.310865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:04,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65513 samples/s/p 0:42:19 } +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1332/ 3125], loss: 0.282, per_step_time: 1415ms, lr: 9.2907993e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:07,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65354 samples/s/p 0:42:17 } +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1334/ 3125], loss: 0.511, per_step_time: 1413ms, lr: 9.270751e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:10,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65967 samples/s/p 0:42:11 } +2024-07-30 05:28:13,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1336/ 3125], loss: 0.386, per_step_time: 1414ms, lr: 9.2507213e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:13,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65580 samples/s/p 0:42:10 } +2024-07-30 05:28:16,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1338/ 3125], loss: 0.166, per_step_time: 1414ms, lr: 9.230703e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:16,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.65770 samples/s/p 0:42:06 } +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1340/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 9.2107143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:18,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65809 samples/s/p 0:42:03 } +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1342/ 3125], loss: 0.111, per_step_time: 1413ms, lr: 9.190744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:21,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.65875 samples/s/p 0:42:00 } +2024-07-30 05:28:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1344/ 3125], loss: 0.151, per_step_time: 1413ms, lr: 9.1707915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:24,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66022 samples/s/p 0:41:57 } +2024-07-30 05:28:27,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1346/ 3125], loss: 0.495, per_step_time: 1413ms, lr: 9.1508593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:27,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66131 samples/s/p 0:41:53 } +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1348/ 3125], loss: 0.077, per_step_time: 1413ms, lr: 9.1309425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:30,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.66057 samples/s/p 0:41:51 } +2024-07-30 05:28:33,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1350/ 3125], loss: 0.083, per_step_time: 1412ms, lr: 9.1110496e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:33,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.66225 samples/s/p 0:41:47 } +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1352/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.0911686e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65914 samples/s/p 0:41:46 } +2024-07-30 05:28:38,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1354/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 9.071317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:38,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65998 samples/s/p 0:41:43 } +2024-07-30 05:28:41,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1356/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 9.0514806e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:41,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.65917 samples/s/p 0:41:40 } +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1358/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 9.0316684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:44,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66058 samples/s/p 0:41:37 } +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1360/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 9.011873e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:47,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.66087 samples/s/p 0:41:34 } +2024-07-30 05:28:50,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1362/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 8.992097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:50,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65882 samples/s/p 0:41:32 } +2024-07-30 05:28:52,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1364/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 8.972341e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:52,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65883 samples/s/p 0:41:29 } +2024-07-30 05:28:55,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1366/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 8.9526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:55,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.65850 samples/s/p 0:41:26 } +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1368/ 3125], loss: 0.402, per_step_time: 1414ms, lr: 8.9328825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:28:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65666 samples/s/p 0:41:24 } +2024-07-30 05:29:01,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1370/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 8.913186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66202 samples/s/p 0:41:19 } +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1372/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 8.8935013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:04,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.65919 samples/s/p 0:41:18 } +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1374/ 3125], loss: 0.073, per_step_time: 1413ms, lr: 8.873841e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:07,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66169 samples/s/p 0:41:14 } +2024-07-30 05:29:09,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1376/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 8.854207e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:09,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.66269 samples/s/p 0:41:10 } +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1378/ 3125], loss: 0.185, per_step_time: 1412ms, lr: 8.834588e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:12,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66304 samples/s/p 0:41:07 } +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1380/ 3125], loss: 0.412, per_step_time: 1412ms, lr: 8.8149875e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:15,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66180 samples/s/p 0:41:05 } +2024-07-30 05:29:18,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1382/ 3125], loss: 0.171, per_step_time: 1413ms, lr: 8.795401e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:18,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66047 samples/s/p 0:41:03 } +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1384/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 8.7758417e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:21,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.66048 samples/s/p 0:41:00 } +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1386/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 8.7563006e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:24,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65763 samples/s/p 0:40:58 } +2024-07-30 05:29:26,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1388/ 3125], loss: 0.225, per_step_time: 1412ms, lr: 8.736783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:26,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66253 samples/s/p 0:40:54 } +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1390/ 3125], loss: 0.344, per_step_time: 1413ms, lr: 8.7172805e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:29,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.65996 samples/s/p 0:40:52 } +2024-07-30 05:29:32,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1392/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 8.697793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:32,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66162 samples/s/p 0:40:48 } +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1394/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 8.678335e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:35,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.66096 samples/s/p 0:40:46 } +2024-07-30 05:29:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1396/ 3125], loss: 0.372, per_step_time: 1414ms, lr: 8.658886e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:38,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65687 samples/s/p 0:40:45 } +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1398/ 3125], loss: 0.180, per_step_time: 1414ms, lr: 8.6394635e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:41,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65414 samples/s/p 0:40:43 } +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1400/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 8.620065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:43,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65893 samples/s/p 0:40:38 } +2024-07-30 05:29:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1402/ 3125], loss: 0.256, per_step_time: 1415ms, lr: 8.6006816e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.65323 samples/s/p 0:40:38 } +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1404/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 8.581319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:49,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.66109 samples/s/p 0:40:32 } +2024-07-30 05:29:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1406/ 3125], loss: 0.133, per_step_time: 1413ms, lr: 8.5619746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:52,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65906 samples/s/p 0:40:30 } +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1408/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 8.5426535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.66025 samples/s/p 0:40:26 } +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1410/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.523345e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:29:58,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65914 samples/s/p 0:40:24 } +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1412/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 8.5040597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:00,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65966 samples/s/p 0:40:21 } +2024-07-30 05:30:03,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1414/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 8.4847983e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:03,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.65623 samples/s/p 0:40:19 } +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1416/ 3125], loss: 0.201, per_step_time: 1413ms, lr: 8.4655494e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:06,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.65829 samples/s/p 0:40:16 } +2024-07-30 05:30:09,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1418/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 8.446324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:09,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66085 samples/s/p 0:40:12 } +2024-07-30 05:30:12,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1420/ 3125], loss: 0.274, per_step_time: 1425ms, lr: 8.427119e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:12,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.61072 samples/s/p 0:40:31 } +2024-07-30 05:30:15,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1422/ 3125], loss: 0.061, per_step_time: 1413ms, lr: 8.407938e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.66142 samples/s/p 0:40:06 } +2024-07-30 05:30:17,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1424/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 8.3887664e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:17,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65990 samples/s/p 0:40:04 } +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1426/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 8.3696216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:20,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65442 samples/s/p 0:40:03 } +2024-07-30 05:30:23,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1428/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 8.3505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:23,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66081 samples/s/p 0:39:58 } +2024-07-30 05:30:26,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1430/ 3125], loss: 0.045, per_step_time: 1414ms, lr: 8.331391e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:26,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.65749 samples/s/p 0:39:56 } +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1432/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 8.3123115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:29,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.66031 samples/s/p 0:39:52 } +2024-07-30 05:30:32,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1434/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 8.293244e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:32,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.66038 samples/s/p 0:39:49 } +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1436/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 8.2741946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:34,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.66010 samples/s/p 0:39:47 } +2024-07-30 05:30:37,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1438/ 3125], loss: 0.568, per_step_time: 1413ms, lr: 8.2551685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:37,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.65782 samples/s/p 0:39:45 } +2024-07-30 05:30:40,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1440/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 8.236155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:40,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66148 samples/s/p 0:39:41 } +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1442/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 8.217174e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:43,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.66084 samples/s/p 0:39:38 } +2024-07-30 05:30:46,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1444/ 3125], loss: 0.327, per_step_time: 1413ms, lr: 8.1982074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:46,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66005 samples/s/p 0:39:35 } +2024-07-30 05:30:49,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1446/ 3125], loss: 0.187, per_step_time: 1412ms, lr: 8.179262e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:49,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66200 samples/s/p 0:39:32 } +2024-07-30 05:30:51,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1448/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 8.160338e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.65941 samples/s/p 0:39:30 } +2024-07-30 05:30:54,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1450/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 8.141431e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:54,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.66151 samples/s/p 0:39:26 } +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1452/ 3125], loss: 0.133, per_step_time: 1417ms, lr: 8.1225454e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:30:57,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.64572 samples/s/p 0:39:30 } +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1454/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 8.1036774e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:00,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66004 samples/s/p 0:39:21 } +2024-07-30 05:31:03,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1456/ 3125], loss: 0.208, per_step_time: 1412ms, lr: 8.0848275e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:03,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66270 samples/s/p 0:39:17 } +2024-07-30 05:31:06,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1458/ 3125], loss: 0.203, per_step_time: 1412ms, lr: 8.0660044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:06,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.66179 samples/s/p 0:39:15 } +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1460/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 8.047193e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:08,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.65931 samples/s/p 0:39:13 } +2024-07-30 05:31:11,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1462/ 3125], loss: 0.264, per_step_time: 1414ms, lr: 8.028409e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:11,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65750 samples/s/p 0:39:11 } +2024-07-30 05:31:14,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1464/ 3125], loss: 0.249, per_step_time: 1413ms, lr: 8.0096453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:14,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66075 samples/s/p 0:39:07 } +2024-07-30 05:31:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1466/ 3125], loss: 0.311, per_step_time: 1413ms, lr: 7.9908966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:17,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65789 samples/s/p 0:39:05 } +2024-07-30 05:31:20,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1468/ 3125], loss: 0.140, per_step_time: 1412ms, lr: 7.9721656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:20,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.66234 samples/s/p 0:39:01 } +2024-07-30 05:31:23,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1470/ 3125], loss: 0.457, per_step_time: 1413ms, lr: 7.9534647e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:23,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.65942 samples/s/p 0:38:59 } +2024-07-30 05:31:25,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1472/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 7.9347785e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:25,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.66066 samples/s/p 0:38:56 } +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1474/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 7.916108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:28,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65427 samples/s/p 0:38:55 } +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1476/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 7.8974665e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:31,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65794 samples/s/p 0:38:51 } +2024-07-30 05:31:34,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1478/ 3125], loss: 0.465, per_step_time: 1414ms, lr: 7.87884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:34,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.65759 samples/s/p 0:38:48 } +2024-07-30 05:31:37,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1480/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.860231e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:37,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65798 samples/s/p 0:38:45 } +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1482/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 7.841646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:40,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65842 samples/s/p 0:38:42 } +2024-07-30 05:31:42,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1484/ 3125], loss: 0.245, per_step_time: 1414ms, lr: 7.8230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:42,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65585 samples/s/p 0:38:41 } +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1486/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 7.804531e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:45,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65844 samples/s/p 0:38:37 } +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1488/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 7.7860085e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:48,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.65371 samples/s/p 0:38:36 } +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1490/ 3125], loss: 0.481, per_step_time: 1412ms, lr: 7.767504e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:51,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66343 samples/s/p 0:38:29 } +2024-07-30 05:31:54,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1492/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 7.7490176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:54,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66094 samples/s/p 0:38:27 } +2024-07-30 05:31:57,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1494/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 7.7305555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:57,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.65782 samples/s/p 0:38:26 } +2024-07-30 05:31:59,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1496/ 3125], loss: 0.301, per_step_time: 1413ms, lr: 7.7121075e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:31:59,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66103 samples/s/p 0:38:22 } +2024-07-30 05:32:02,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1498/ 3125], loss: 0.152, per_step_time: 1412ms, lr: 7.693684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.66190 samples/s/p 0:38:18 } +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1500/ 3125], loss: 0.262, per_step_time: 1415ms, lr: 7.675281e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:05,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65042 samples/s/p 0:38:20 } +2024-07-30 05:32:08,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1502/ 3125], loss: 0.083, per_step_time: 1413ms, lr: 7.656899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:08,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66033 samples/s/p 0:38:13 } +2024-07-30 05:32:11,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1504/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 7.6385317e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:11,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.66167 samples/s/p 0:38:10 } +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1506/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 7.6201883e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:14,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.65685 samples/s/p 0:38:09 } +2024-07-30 05:32:16,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1508/ 3125], loss: 0.138, per_step_time: 1413ms, lr: 7.601866e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:16,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66075 samples/s/p 0:38:05 } +2024-07-30 05:32:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1510/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 7.583564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:19,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66042 samples/s/p 0:38:02 } +2024-07-30 05:32:22,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1512/ 3125], loss: 0.093, per_step_time: 1413ms, lr: 7.5652775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:22,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65941 samples/s/p 0:38:00 } +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1514/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 7.547015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.66041 samples/s/p 0:37:56 } +2024-07-30 05:32:28,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1516/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 7.5287755e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:28,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.65923 samples/s/p 0:37:54 } +2024-07-30 05:32:31,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1518/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 7.5105544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66088 samples/s/p 0:37:51 } +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1520/ 3125], loss: 0.386, per_step_time: 1412ms, lr: 7.492354e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:33,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66214 samples/s/p 0:37:47 } +2024-07-30 05:32:36,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1522/ 3125], loss: 0.440, per_step_time: 1413ms, lr: 7.474175e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:36,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65864 samples/s/p 0:37:46 } +2024-07-30 05:32:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1524/ 3125], loss: 0.357, per_step_time: 1413ms, lr: 7.4560074e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.65781 samples/s/p 0:37:43 } +2024-07-30 05:32:42,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1526/ 3125], loss: 0.135, per_step_time: 1412ms, lr: 7.43787e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:42,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.66288 samples/s/p 0:37:38 } +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1528/ 3125], loss: 0.246, per_step_time: 1414ms, lr: 7.419744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:45,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65600 samples/s/p 0:37:38 } +2024-07-30 05:32:48,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1530/ 3125], loss: 0.320, per_step_time: 1413ms, lr: 7.401645e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:48,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.66023 samples/s/p 0:37:34 } +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1532/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 7.383564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:50,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.65900 samples/s/p 0:37:31 } +2024-07-30 05:32:53,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1534/ 3125], loss: 0.174, per_step_time: 1412ms, lr: 7.3655065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:53,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.66204 samples/s/p 0:37:27 } +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1536/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 7.3474706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:56,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66261 samples/s/p 0:37:24 } +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1538/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.3294547e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:32:59,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66134 samples/s/p 0:37:22 } +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1540/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.311451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:02,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.65761 samples/s/p 0:37:21 } +2024-07-30 05:33:05,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1542/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 7.2934745e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:05,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66021 samples/s/p 0:37:17 } +2024-07-30 05:33:07,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1544/ 3125], loss: 0.098, per_step_time: 1413ms, lr: 7.2755154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:07,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.66132 samples/s/p 0:37:14 } +2024-07-30 05:33:10,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1546/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 7.2575807e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65944 samples/s/p 0:37:12 } +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1548/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 7.23966e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:13,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.66008 samples/s/p 0:37:08 } +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1550/ 3125], loss: 0.208, per_step_time: 1414ms, lr: 7.221764e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:16,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65737 samples/s/p 0:37:07 } +2024-07-30 05:33:19,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1552/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 7.2038887e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:19,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65909 samples/s/p 0:37:03 } +2024-07-30 05:33:22,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1554/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 7.186028e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:22,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.65782 samples/s/p 0:37:01 } +2024-07-30 05:33:24,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1556/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 7.168197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:24,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.66251 samples/s/p 0:36:56 } +2024-07-30 05:33:27,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1558/ 3125], loss: 0.151, per_step_time: 1424ms, lr: 7.1503814e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:27,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.61445 samples/s/p 0:37:12 } +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1560/ 3125], loss: 0.207, per_step_time: 1414ms, lr: 7.1325894e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:30,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65672 samples/s/p 0:36:53 } +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1562/ 3125], loss: 0.316, per_step_time: 1414ms, lr: 7.1148185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:33,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65703 samples/s/p 0:36:50 } +2024-07-30 05:33:36,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1564/ 3125], loss: 0.232, per_step_time: 1414ms, lr: 7.097065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:36,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.65462 samples/s/p 0:36:48 } +2024-07-30 05:33:39,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1566/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 7.079333e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:39,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65762 samples/s/p 0:36:44 } +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1568/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.061618e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66050 samples/s/p 0:36:40 } +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1570/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 7.043928e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:44,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.66054 samples/s/p 0:36:37 } +2024-07-30 05:33:47,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1572/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 7.026252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:47,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.65922 samples/s/p 0:36:35 } +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1574/ 3125], loss: 0.055, per_step_time: 1412ms, lr: 7.008603e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:50,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66226 samples/s/p 0:36:31 } +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1576/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 6.990972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:53,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66155 samples/s/p 0:36:28 } +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1578/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 6.973365e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:56,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65918 samples/s/p 0:36:26 } +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1580/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.9557757e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:33:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.66013 samples/s/p 0:36:23 } +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1582/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 6.93821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:01,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.65957 samples/s/p 0:36:21 } +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1584/ 3125], loss: 0.180, per_step_time: 1413ms, lr: 6.920656e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:04,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66161 samples/s/p 0:36:17 } +2024-07-30 05:34:07,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1586/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 6.9031324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:07,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.65830 samples/s/p 0:36:15 } +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1588/ 3125], loss: 0.271, per_step_time: 1413ms, lr: 6.8856235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66124 samples/s/p 0:36:11 } +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1590/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 6.868142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:13,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.66201 samples/s/p 0:36:08 } +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1592/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 6.8506716e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:16,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.65997 samples/s/p 0:36:06 } +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1594/ 3125], loss: 0.330, per_step_time: 1414ms, lr: 6.833228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:18,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65583 samples/s/p 0:36:05 } +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1596/ 3125], loss: 0.382, per_step_time: 1413ms, lr: 6.8158056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:21,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.66071 samples/s/p 0:36:00 } +2024-07-30 05:34:24,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1598/ 3125], loss: 0.272, per_step_time: 1413ms, lr: 6.7983956e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:24,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65927 samples/s/p 0:35:58 } +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1600/ 3125], loss: 0.229, per_step_time: 1413ms, lr: 6.7810146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:27,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.65946 samples/s/p 0:35:55 } +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1602/ 3125], loss: 0.294, per_step_time: 1413ms, lr: 6.763652e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:30,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65956 samples/s/p 0:35:52 } +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1604/ 3125], loss: 0.324, per_step_time: 1414ms, lr: 6.74631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:33,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65735 samples/s/p 0:35:50 } +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1606/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 6.7289915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:35,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65872 samples/s/p 0:35:47 } +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1608/ 3125], loss: 0.196, per_step_time: 1414ms, lr: 6.711691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.65653 samples/s/p 0:35:45 } +2024-07-30 05:34:41,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1610/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 6.694412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:41,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.66223 samples/s/p 0:35:40 } +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1612/ 3125], loss: 0.206, per_step_time: 1415ms, lr: 6.67715e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:44,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65158 samples/s/p 0:35:41 } +2024-07-30 05:34:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1614/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.659913e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:47,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.65949 samples/s/p 0:35:35 } +2024-07-30 05:34:50,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1616/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 6.64269e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:50,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66075 samples/s/p 0:35:32 } +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1618/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 6.6254944e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:52,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66143 samples/s/p 0:35:29 } +2024-07-30 05:34:55,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1620/ 3125], loss: 0.217, per_step_time: 1412ms, lr: 6.608319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:55,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.66222 samples/s/p 0:35:26 } +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1622/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 6.591165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:34:58,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.65998 samples/s/p 0:35:24 } +2024-07-30 05:35:01,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1624/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 6.574032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:01,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.65847 samples/s/p 0:35:22 } +2024-07-30 05:35:04,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1626/ 3125], loss: 0.105, per_step_time: 1414ms, lr: 6.55691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:04,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.65741 samples/s/p 0:35:19 } +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1628/ 3125], loss: 0.344, per_step_time: 1419ms, lr: 6.5398183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:07,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.63526 samples/s/p 0:35:25 } +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1630/ 3125], loss: 0.373, per_step_time: 1417ms, lr: 6.5227505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:09,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.64537 samples/s/p 0:35:18 } +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1632/ 3125], loss: 0.218, per_step_time: 1413ms, lr: 6.505698e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:12,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65898 samples/s/p 0:35:10 } +2024-07-30 05:35:15,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1634/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 6.488666e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:15,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65929 samples/s/p 0:35:07 } +2024-07-30 05:35:18,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1636/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 6.471661e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:18,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.65879 samples/s/p 0:35:05 } +2024-07-30 05:35:21,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1638/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 6.4546646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:21,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.66162 samples/s/p 0:35:01 } +2024-07-30 05:35:24,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1640/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 6.4376917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:24,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65882 samples/s/p 0:34:59 } +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1642/ 3125], loss: 0.100, per_step_time: 1413ms, lr: 6.420746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:26,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66090 samples/s/p 0:34:55 } +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1644/ 3125], loss: 0.177, per_step_time: 1415ms, lr: 6.4038187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:29,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65270 samples/s/p 0:34:55 } +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1646/ 3125], loss: 0.263, per_step_time: 1412ms, lr: 6.386912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.66177 samples/s/p 0:34:49 } +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1648/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 6.3700315e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.65974 samples/s/p 0:34:47 } +2024-07-30 05:35:38,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1650/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 6.3531667e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:38,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.65977 samples/s/p 0:34:44 } +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1652/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 6.336322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:41,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66066 samples/s/p 0:34:41 } +2024-07-30 05:35:43,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1654/ 3125], loss: 0.257, per_step_time: 1412ms, lr: 6.319502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:43,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66216 samples/s/p 0:34:38 } +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1656/ 3125], loss: 0.157, per_step_time: 1412ms, lr: 6.3026965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:46,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.66270 samples/s/p 0:34:35 } +2024-07-30 05:35:49,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1658/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 6.285912e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:49,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65840 samples/s/p 0:34:34 } +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1660/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 6.269154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:52,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66177 samples/s/p 0:34:30 } +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1662/ 3125], loss: 0.259, per_step_time: 1412ms, lr: 6.2524106e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:55,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66194 samples/s/p 0:34:27 } +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1664/ 3125], loss: 0.147, per_step_time: 1415ms, lr: 6.2356946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:35:58,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.65152 samples/s/p 0:34:28 } +2024-07-30 05:36:00,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1666/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 6.2189963e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:00,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.66217 samples/s/p 0:34:21 } +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1668/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 6.202322e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:03,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65826 samples/s/p 0:34:19 } +2024-07-30 05:36:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1670/ 3125], loss: 0.194, per_step_time: 1414ms, lr: 6.1856593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65746 samples/s/p 0:34:17 } +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1672/ 3125], loss: 0.371, per_step_time: 1414ms, lr: 6.169027e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:09,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65651 samples/s/p 0:34:14 } +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1674/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 6.152415e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:12,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65766 samples/s/p 0:34:11 } +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1676/ 3125], loss: 0.320, per_step_time: 1414ms, lr: 6.135824e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:15,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.65687 samples/s/p 0:34:09 } +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1678/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 6.119251e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:17,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66149 samples/s/p 0:34:04 } +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1680/ 3125], loss: 0.404, per_step_time: 1412ms, lr: 6.1026986e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:20,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66171 samples/s/p 0:34:01 } +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1682/ 3125], loss: 0.209, per_step_time: 1413ms, lr: 6.0861674e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:23,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66002 samples/s/p 0:33:59 } +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1684/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 6.069654e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:26,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.66014 samples/s/p 0:33:56 } +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1686/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 6.053165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:29,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66083 samples/s/p 0:33:53 } +2024-07-30 05:36:32,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1688/ 3125], loss: 0.224, per_step_time: 1412ms, lr: 6.036699e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:32,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66186 samples/s/p 0:33:50 } +2024-07-30 05:36:34,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1690/ 3125], loss: 0.472, per_step_time: 1412ms, lr: 6.0202535e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:34,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66323 samples/s/p 0:33:47 } +2024-07-30 05:36:37,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1692/ 3125], loss: 0.378, per_step_time: 1413ms, lr: 6.003827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:37,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.65987 samples/s/p 0:33:45 } +2024-07-30 05:36:40,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1694/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 5.9874264e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:40,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.66148 samples/s/p 0:33:42 } +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1696/ 3125], loss: 0.134, per_step_time: 1412ms, lr: 5.971044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:43,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66220 samples/s/p 0:33:39 } +2024-07-30 05:36:46,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1698/ 3125], loss: 0.266, per_step_time: 1413ms, lr: 5.9546767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:46,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65983 samples/s/p 0:33:37 } +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1700/ 3125], loss: 0.364, per_step_time: 1413ms, lr: 5.938336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:49,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.66015 samples/s/p 0:33:34 } +2024-07-30 05:36:51,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1702/ 3125], loss: 0.365, per_step_time: 1413ms, lr: 5.922016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:51,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65849 samples/s/p 0:33:31 } +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1704/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 5.9057203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:54,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.65866 samples/s/p 0:33:28 } +2024-07-30 05:36:57,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1706/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 5.8894364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:36:57,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65426 samples/s/p 0:33:27 } +2024-07-30 05:37:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1708/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 5.8731825e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:00,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.66063 samples/s/p 0:33:22 } +2024-07-30 05:37:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1710/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 5.856946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.66004 samples/s/p 0:33:19 } +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1712/ 3125], loss: 0.234, per_step_time: 1413ms, lr: 5.8407306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:06,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65811 samples/s/p 0:33:17 } +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1714/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 5.824533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:08,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.65981 samples/s/p 0:33:14 } +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1716/ 3125], loss: 0.192, per_step_time: 1414ms, lr: 5.8083623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:11,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65509 samples/s/p 0:33:13 } +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1718/ 3125], loss: 0.193, per_step_time: 1414ms, lr: 5.792209e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:14,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65562 samples/s/p 0:33:10 } +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1720/ 3125], loss: 0.420, per_step_time: 1414ms, lr: 5.7760803e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:17,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65749 samples/s/p 0:33:06 } +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1722/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 5.759972e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:20,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.65794 samples/s/p 0:33:03 } +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1724/ 3125], loss: 0.136, per_step_time: 1415ms, lr: 5.7438876e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:23,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65325 samples/s/p 0:33:02 } +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1726/ 3125], loss: 0.655, per_step_time: 1415ms, lr: 5.7278123e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:25,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.65347 samples/s/p 0:32:59 } +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1728/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 5.71177e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:28,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66062 samples/s/p 0:32:54 } +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1730/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6957424e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:31,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66046 samples/s/p 0:32:51 } +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1732/ 3125], loss: 0.220, per_step_time: 1413ms, lr: 5.6797353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:34,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.66078 samples/s/p 0:32:48 } +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1734/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 5.6637555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:37,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.65984 samples/s/p 0:32:46 } +2024-07-30 05:37:40,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1736/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 5.647793e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:40,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66222 samples/s/p 0:32:42 } +2024-07-30 05:37:42,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1738/ 3125], loss: 0.089, per_step_time: 1413ms, lr: 5.631855e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:42,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66054 samples/s/p 0:32:40 } +2024-07-30 05:37:45,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1740/ 3125], loss: 0.575, per_step_time: 1413ms, lr: 5.6159377e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:45,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66128 samples/s/p 0:32:37 } +2024-07-30 05:37:48,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1742/ 3125], loss: 0.189, per_step_time: 1413ms, lr: 5.600035e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:48,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.66022 samples/s/p 0:32:34 } +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1744/ 3125], loss: 0.258, per_step_time: 1412ms, lr: 5.5841593e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:51,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66182 samples/s/p 0:32:31 } +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1746/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 5.5683046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:54,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66321 samples/s/p 0:32:28 } +2024-07-30 05:37:57,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1748/ 3125], loss: 0.137, per_step_time: 1413ms, lr: 5.5524737e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:57,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.66014 samples/s/p 0:32:26 } +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1750/ 3125], loss: 0.195, per_step_time: 1414ms, lr: 5.536655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:37:59,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.65562 samples/s/p 0:32:24 } +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1752/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 5.5208653e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:02,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66094 samples/s/p 0:32:20 } +2024-07-30 05:38:05,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1754/ 3125], loss: 0.277, per_step_time: 1412ms, lr: 5.505097e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:05,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66249 samples/s/p 0:32:16 } +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1756/ 3125], loss: 0.154, per_step_time: 1413ms, lr: 5.4893405e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65871 samples/s/p 0:32:15 } +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1758/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 5.4736165e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:11,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.65995 samples/s/p 0:32:12 } +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1760/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.457908e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:14,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.66107 samples/s/p 0:32:08 } +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1762/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 5.442223e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:16,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.65805 samples/s/p 0:32:07 } +2024-07-30 05:38:19,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1764/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 5.4265615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:19,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66074 samples/s/p 0:32:03 } +2024-07-30 05:38:22,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1766/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 5.4109216e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:22,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66095 samples/s/p 0:32:00 } +2024-07-30 05:38:25,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1768/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 5.395296e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66065 samples/s/p 0:31:57 } +2024-07-30 05:38:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1770/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 5.379692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:28,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.66115 samples/s/p 0:31:54 } +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1772/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 5.364117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:31,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66080 samples/s/p 0:31:52 } +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1774/ 3125], loss: 0.285, per_step_time: 1413ms, lr: 5.3485513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:33,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.65774 samples/s/p 0:31:50 } +2024-07-30 05:38:36,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1776/ 3125], loss: 0.198, per_step_time: 1413ms, lr: 5.333021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:36,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66105 samples/s/p 0:31:46 } +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1778/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 5.317503e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.66051 samples/s/p 0:31:43 } +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1780/ 3125], loss: 0.378, per_step_time: 1414ms, lr: 5.302012e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:42,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65737 samples/s/p 0:31:41 } +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1782/ 3125], loss: 0.191, per_step_time: 1414ms, lr: 5.2865414e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:45,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65381 samples/s/p 0:31:40 } +2024-07-30 05:38:48,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1784/ 3125], loss: 0.450, per_step_time: 1413ms, lr: 5.271089e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65999 samples/s/p 0:31:35 } +2024-07-30 05:38:50,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1786/ 3125], loss: 0.255, per_step_time: 1412ms, lr: 5.2556544e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:50,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.66212 samples/s/p 0:31:31 } +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1788/ 3125], loss: 0.179, per_step_time: 1414ms, lr: 5.240249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:53,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.65424 samples/s/p 0:31:31 } +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1790/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 5.2248623e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:56,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66125 samples/s/p 0:31:26 } +2024-07-30 05:38:59,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1792/ 3125], loss: 0.286, per_step_time: 1413ms, lr: 5.2094964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:38:59,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65987 samples/s/p 0:31:24 } +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1794/ 3125], loss: 0.345, per_step_time: 1413ms, lr: 5.194148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:02,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65910 samples/s/p 0:31:21 } +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1796/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 5.178827e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.65792 samples/s/p 0:31:19 } +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1798/ 3125], loss: 0.233, per_step_time: 1413ms, lr: 5.1635266e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:07,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.66116 samples/s/p 0:31:15 } +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1800/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 5.1482436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65802 samples/s/p 0:31:13 } +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1802/ 3125], loss: 0.427, per_step_time: 1414ms, lr: 5.132985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:13,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65755 samples/s/p 0:31:10 } +2024-07-30 05:39:16,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1804/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 5.11775e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:16,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.66033 samples/s/p 0:31:07 } +2024-07-30 05:39:19,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1806/ 3125], loss: 0.253, per_step_time: 1414ms, lr: 5.102533e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.65478 samples/s/p 0:31:06 } +2024-07-30 05:39:22,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1808/ 3125], loss: 0.403, per_step_time: 1414ms, lr: 5.08734e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:22,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65768 samples/s/p 0:31:02 } +2024-07-30 05:39:24,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1810/ 3125], loss: 0.121, per_step_time: 1413ms, lr: 5.072167e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:24,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65975 samples/s/p 0:30:58 } +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1812/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 5.057019e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:27,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.65951 samples/s/p 0:30:55 } +2024-07-30 05:39:30,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1814/ 3125], loss: 0.128, per_step_time: 1414ms, lr: 5.0418885e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:30,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65486 samples/s/p 0:30:54 } +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1816/ 3125], loss: 0.300, per_step_time: 1414ms, lr: 5.0267784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.65695 samples/s/p 0:30:51 } +2024-07-30 05:39:36,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1818/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 5.0116836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:36,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65592 samples/s/p 0:30:48 } +2024-07-30 05:39:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1820/ 3125], loss: 0.252, per_step_time: 1415ms, lr: 4.996621e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:39,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65163 samples/s/p 0:30:47 } +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1822/ 3125], loss: 0.149, per_step_time: 1414ms, lr: 4.981577e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:41,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65405 samples/s/p 0:30:43 } +2024-07-30 05:39:44,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1824/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.966557e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:44,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65766 samples/s/p 0:30:39 } +2024-07-30 05:39:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1826/ 3125], loss: 0.327, per_step_time: 1414ms, lr: 4.9515575e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:47,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.65609 samples/s/p 0:30:37 } +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1828/ 3125], loss: 0.129, per_step_time: 1415ms, lr: 4.936573e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:50,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.64990 samples/s/p 0:30:36 } +2024-07-30 05:39:53,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1830/ 3125], loss: 0.336, per_step_time: 1414ms, lr: 4.921615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:53,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65498 samples/s/p 0:30:32 } +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1832/ 3125], loss: 0.366, per_step_time: 1414ms, lr: 4.906681e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:56,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65400 samples/s/p 0:30:29 } +2024-07-30 05:39:58,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1834/ 3125], loss: 0.434, per_step_time: 1414ms, lr: 4.891765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:39:58,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.65539 samples/s/p 0:30:26 } +2024-07-30 05:40:01,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1836/ 3125], loss: 0.215, per_step_time: 1415ms, lr: 4.8768726e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:01,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65248 samples/s/p 0:30:24 } +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1838/ 3125], loss: 0.347, per_step_time: 1415ms, lr: 4.8619955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:04,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65121 samples/s/p 0:30:21 } +2024-07-30 05:40:07,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1840/ 3125], loss: 0.267, per_step_time: 1414ms, lr: 4.847148e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:07,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65403 samples/s/p 0:30:18 } +2024-07-30 05:40:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1842/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 4.8323153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:10,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65605 samples/s/p 0:30:14 } +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1844/ 3125], loss: 0.343, per_step_time: 1414ms, lr: 4.8175065e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:13,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.65601 samples/s/p 0:30:11 } +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1846/ 3125], loss: 0.308, per_step_time: 1413ms, lr: 4.802728e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:15,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.65945 samples/s/p 0:30:07 } +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1848/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 4.7879604e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:18,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66079 samples/s/p 0:30:04 } +2024-07-30 05:40:21,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1850/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.7732203e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:21,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66048 samples/s/p 0:30:01 } +2024-07-30 05:40:24,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1852/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 4.758501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:24,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66084 samples/s/p 0:29:59 } +2024-07-30 05:40:27,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1854/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 4.7438024e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:27,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.66147 samples/s/p 0:29:56 } +2024-07-30 05:40:30,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1856/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 4.7291277e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:30,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.66136 samples/s/p 0:29:53 } +2024-07-30 05:40:32,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1858/ 3125], loss: 0.332, per_step_time: 1414ms, lr: 4.714465e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:32,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65762 samples/s/p 0:29:51 } +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1860/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 4.699832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:35,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65850 samples/s/p 0:29:48 } +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1862/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 4.685214e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:38,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65794 samples/s/p 0:29:45 } +2024-07-30 05:40:41,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1864/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 4.670626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:41,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.65779 samples/s/p 0:29:43 } +2024-07-30 05:40:44,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1866/ 3125], loss: 0.310, per_step_time: 1414ms, lr: 4.6560555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:44,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65716 samples/s/p 0:29:40 } +2024-07-30 05:40:47,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1868/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 4.641509e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:47,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65791 samples/s/p 0:29:37 } +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1870/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.6269832e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:50,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.65872 samples/s/p 0:29:34 } +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1872/ 3125], loss: 0.387, per_step_time: 1413ms, lr: 4.6124725e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:52,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.66053 samples/s/p 0:29:30 } +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1874/ 3125], loss: 0.357, per_step_time: 1412ms, lr: 4.5979917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:55,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66173 samples/s/p 0:29:27 } +2024-07-30 05:40:58,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1876/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 4.5835316e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:40:58,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66036 samples/s/p 0:29:25 } +2024-07-30 05:41:01,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1878/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 4.5690953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:01,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.66156 samples/s/p 0:29:22 } +2024-07-30 05:41:04,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1880/ 3125], loss: 0.405, per_step_time: 1414ms, lr: 4.554677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:04,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65667 samples/s/p 0:29:20 } +2024-07-30 05:41:07,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1882/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 4.5402763e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:07,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.65980 samples/s/p 0:29:16 } +2024-07-30 05:41:09,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1884/ 3125], loss: 0.185, per_step_time: 1414ms, lr: 4.5259057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:09,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65522 samples/s/p 0:29:15 } +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1886/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 4.51155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:12,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65421 samples/s/p 0:29:13 } +2024-07-30 05:41:15,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1888/ 3125], loss: 0.370, per_step_time: 1414ms, lr: 4.497218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:15,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65602 samples/s/p 0:29:09 } +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1890/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 4.482907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:18,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.66128 samples/s/p 0:29:05 } +2024-07-30 05:41:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1892/ 3125], loss: 0.427, per_step_time: 1413ms, lr: 4.4686226e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:21,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.65998 samples/s/p 0:29:02 } +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1894/ 3125], loss: 0.375, per_step_time: 1413ms, lr: 4.4543594e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:24,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65905 samples/s/p 0:29:00 } +2024-07-30 05:41:26,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1896/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 4.440114e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:26,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65788 samples/s/p 0:28:57 } +2024-07-30 05:41:29,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1898/ 3125], loss: 0.309, per_step_time: 1413ms, lr: 4.4258923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:29,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.65989 samples/s/p 0:28:54 } +2024-07-30 05:41:32,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1900/ 3125], loss: 0.282, per_step_time: 1425ms, lr: 4.4116854e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:32,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.61331 samples/s/p 0:29:05 } +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1902/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 4.3975083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:35,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66077 samples/s/p 0:28:48 } +2024-07-30 05:41:38,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1904/ 3125], loss: 0.279, per_step_time: 1413ms, lr: 4.3833552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:38,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66149 samples/s/p 0:28:45 } +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1906/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 4.369217e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:41,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66165 samples/s/p 0:28:42 } +2024-07-30 05:41:43,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1908/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.3550997e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:43,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66054 samples/s/p 0:28:39 } +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1910/ 3125], loss: 0.236, per_step_time: 1412ms, lr: 4.3410122e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.66235 samples/s/p 0:28:36 } +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1912/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 4.3269455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:49,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.65931 samples/s/p 0:28:34 } +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1914/ 3125], loss: 0.216, per_step_time: 1412ms, lr: 4.3128907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:52,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66181 samples/s/p 0:28:31 } +2024-07-30 05:41:55,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1916/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 4.2988657e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:55,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66017 samples/s/p 0:28:28 } +2024-07-30 05:41:58,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1918/ 3125], loss: 0.416, per_step_time: 1413ms, lr: 4.2848615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:41:58,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66163 samples/s/p 0:28:25 } +2024-07-30 05:42:00,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1920/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 4.2708783e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:00,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.66134 samples/s/p 0:28:22 } +2024-07-30 05:42:03,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1922/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 4.2569218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:03,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66121 samples/s/p 0:28:19 } +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1924/ 3125], loss: 0.437, per_step_time: 1413ms, lr: 4.2429835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:06,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.65894 samples/s/p 0:28:17 } +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1926/ 3125], loss: 0.358, per_step_time: 1413ms, lr: 4.2290628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:09,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66013 samples/s/p 0:28:14 } +2024-07-30 05:42:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1928/ 3125], loss: 0.454, per_step_time: 1413ms, lr: 4.215169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:12,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.66035 samples/s/p 0:28:11 } +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1930/ 3125], loss: 0.215, per_step_time: 1412ms, lr: 4.20129e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:15,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66280 samples/s/p 0:28:08 } +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1932/ 3125], loss: 0.346, per_step_time: 1413ms, lr: 4.1874407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.66154 samples/s/p 0:28:05 } +2024-07-30 05:42:20,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1934/ 3125], loss: 0.110, per_step_time: 1414ms, lr: 4.1736124e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:20,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65622 samples/s/p 0:28:04 } +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1936/ 3125], loss: 0.433, per_step_time: 1413ms, lr: 4.159802e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:23,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65839 samples/s/p 0:28:01 } +2024-07-30 05:42:26,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1938/ 3125], loss: 0.167, per_step_time: 1413ms, lr: 4.1460186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:26,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.65971 samples/s/p 0:27:57 } +2024-07-30 05:42:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1940/ 3125], loss: 0.112, per_step_time: 1413ms, lr: 4.132256e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66122 samples/s/p 0:27:54 } +2024-07-30 05:42:32,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1942/ 3125], loss: 0.137, per_step_time: 1416ms, lr: 4.118514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:32,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.64958 samples/s/p 0:27:55 } +2024-07-30 05:42:34,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1944/ 3125], loss: 0.308, per_step_time: 1414ms, lr: 4.10479e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:34,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65730 samples/s/p 0:27:50 } +2024-07-30 05:42:37,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1946/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 4.091096e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:37,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.65975 samples/s/p 0:27:46 } +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1948/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 4.0774196e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:40,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.66006 samples/s/p 0:27:43 } +2024-07-30 05:42:43,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1950/ 3125], loss: 0.188, per_step_time: 1413ms, lr: 4.063761e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65863 samples/s/p 0:27:41 } +2024-07-30 05:42:46,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1952/ 3125], loss: 0.390, per_step_time: 1413ms, lr: 4.0501297e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:46,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.65919 samples/s/p 0:27:38 } +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1954/ 3125], loss: 0.410, per_step_time: 1413ms, lr: 4.0365188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:49,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66085 samples/s/p 0:27:34 } +2024-07-30 05:42:51,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1956/ 3125], loss: 0.320, per_step_time: 1412ms, lr: 4.0229318e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:51,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.66227 samples/s/p 0:27:31 } +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1958/ 3125], loss: 0.266, per_step_time: 1412ms, lr: 4.00936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:54,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66215 samples/s/p 0:27:28 } +2024-07-30 05:42:57,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1960/ 3125], loss: 0.147, per_step_time: 1418ms, lr: 3.995821e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:42:57,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.64095 samples/s/p 0:27:32 } +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1962/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 3.9822964e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.65997 samples/s/p 0:27:23 } +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1964/ 3125], loss: 0.287, per_step_time: 1412ms, lr: 3.968799e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:03,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.66322 samples/s/p 0:27:20 } +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1966/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.9553166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:06,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.65997 samples/s/p 0:27:18 } +2024-07-30 05:43:08,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1968/ 3125], loss: 0.158, per_step_time: 1413ms, lr: 3.9418606e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:08,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65997 samples/s/p 0:27:15 } +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1970/ 3125], loss: 0.176, per_step_time: 1413ms, lr: 3.9284288e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:11,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65860 samples/s/p 0:27:12 } +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1972/ 3125], loss: 0.169, per_step_time: 1413ms, lr: 3.9150117e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:14,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65900 samples/s/p 0:27:09 } +2024-07-30 05:43:17,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1974/ 3125], loss: 0.306, per_step_time: 1415ms, lr: 3.9016186e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:17,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65327 samples/s/p 0:27:08 } +2024-07-30 05:43:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1976/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 3.888252e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.65949 samples/s/p 0:27:04 } +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1978/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 3.874904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:23,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65994 samples/s/p 0:27:01 } +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1980/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 3.8615792e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.66145 samples/s/p 0:26:57 } +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1982/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 3.8482784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:28,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65799 samples/s/p 0:26:56 } +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1984/ 3125], loss: 0.371, per_step_time: 1413ms, lr: 3.8349955e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:31,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.65991 samples/s/p 0:26:52 } +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1986/ 3125], loss: 0.249, per_step_time: 1416ms, lr: 3.8217425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:34,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.64908 samples/s/p 0:26:53 } +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1988/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 3.8085014e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:37,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66099 samples/s/p 0:26:46 } +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1990/ 3125], loss: 0.203, per_step_time: 1415ms, lr: 3.795287e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:40,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65338 samples/s/p 0:26:46 } +2024-07-30 05:43:42,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1992/ 3125], loss: 0.162, per_step_time: 1412ms, lr: 3.7820934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:42,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.66307 samples/s/p 0:26:40 } +2024-07-30 05:43:45,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1994/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7689267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.65939 samples/s/p 0:26:38 } +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1996/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 3.755772e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65678 samples/s/p 0:26:36 } +2024-07-30 05:43:51,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 1998/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 3.7426472e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:51,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.65833 samples/s/p 0:26:33 } +2024-07-30 05:43:54,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2000/ 3125], loss: 0.219, per_step_time: 1414ms, lr: 3.729546e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:54,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65642 samples/s/p 0:26:31 } +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2002/ 3125], loss: 0.322, per_step_time: 1414ms, lr: 3.7164597e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:57,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.65728 samples/s/p 0:26:28 } +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2004/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 3.7034005e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:43:59,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.66071 samples/s/p 0:26:24 } +2024-07-30 05:44:02,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2006/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.690362e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:02,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65900 samples/s/p 0:26:21 } +2024-07-30 05:44:05,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2008/ 3125], loss: 0.410, per_step_time: 1412ms, lr: 3.677347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:05,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66273 samples/s/p 0:26:18 } +2024-07-30 05:44:08,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2010/ 3125], loss: 0.255, per_step_time: 1413ms, lr: 3.6643564e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:08,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66056 samples/s/p 0:26:15 } +2024-07-30 05:44:11,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2012/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 3.6513865e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:11,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.65952 samples/s/p 0:26:13 } +2024-07-30 05:44:14,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2014/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 3.6384372e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:14,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.66024 samples/s/p 0:26:10 } +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2016/ 3125], loss: 0.380, per_step_time: 1412ms, lr: 3.625506e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:16,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66233 samples/s/p 0:26:06 } +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2018/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 3.6126016e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:19,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.65986 samples/s/p 0:26:04 } +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2020/ 3125], loss: 0.414, per_step_time: 1413ms, lr: 3.599718e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:22,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66116 samples/s/p 0:26:01 } +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2022/ 3125], loss: 0.103, per_step_time: 1413ms, lr: 3.5868555e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:25,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.66081 samples/s/p 0:25:58 } +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2024/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 3.5740166e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66150 samples/s/p 0:25:55 } +2024-07-30 05:44:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2026/ 3125], loss: 0.157, per_step_time: 1413ms, lr: 3.5612015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:31,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66090 samples/s/p 0:25:53 } +2024-07-30 05:44:33,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2028/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 3.5484044e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:33,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66083 samples/s/p 0:25:50 } +2024-07-30 05:44:36,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2030/ 3125], loss: 0.238, per_step_time: 1413ms, lr: 3.535631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.65786 samples/s/p 0:25:48 } +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2032/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 3.5228848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:39,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.66035 samples/s/p 0:25:44 } +2024-07-30 05:44:42,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2034/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.5101561e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:42,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66055 samples/s/p 0:25:41 } +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2036/ 3125], loss: 0.307, per_step_time: 1413ms, lr: 3.4974514e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:45,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.66025 samples/s/p 0:25:39 } +2024-07-30 05:44:48,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2038/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 3.4847704e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:48,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65869 samples/s/p 0:25:36 } +2024-07-30 05:44:50,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2040/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 3.4721046e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:50,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65990 samples/s/p 0:25:33 } +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2042/ 3125], loss: 0.288, per_step_time: 1414ms, lr: 3.4594655e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:53,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.65686 samples/s/p 0:25:31 } +2024-07-30 05:44:56,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2044/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 3.446847e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:56,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65763 samples/s/p 0:25:28 } +2024-07-30 05:44:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2046/ 3125], loss: 0.145, per_step_time: 1414ms, lr: 3.4342526e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:44:59,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65607 samples/s/p 0:25:26 } +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2048/ 3125], loss: 0.373, per_step_time: 1412ms, lr: 3.421682e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:02,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.66192 samples/s/p 0:25:21 } +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2050/ 3125], loss: 0.396, per_step_time: 1413ms, lr: 3.4091323e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:05,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.65932 samples/s/p 0:25:19 } +2024-07-30 05:45:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2052/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.3966063e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:07,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65990 samples/s/p 0:25:16 } +2024-07-30 05:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2054/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 3.3841013e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65887 samples/s/p 0:25:14 } +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2056/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.3716202e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:13,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.66056 samples/s/p 0:25:10 } +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2058/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 3.3591598e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65753 samples/s/p 0:25:08 } +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2060/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 3.3467143e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:19,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.65925 samples/s/p 0:25:05 } +2024-07-30 05:45:22,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2062/ 3125], loss: 0.276, per_step_time: 1418ms, lr: 3.3342985e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:22,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64109 samples/s/p 0:25:07 } +2024-07-30 05:45:24,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2064/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 3.321907e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:24,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66085 samples/s/p 0:24:59 } +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2066/ 3125], loss: 0.146, per_step_time: 1412ms, lr: 3.30953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:27,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66231 samples/s/p 0:24:56 } +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2068/ 3125], loss: 0.238, per_step_time: 1417ms, lr: 3.297183e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:30,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.64305 samples/s/p 0:24:58 } +2024-07-30 05:45:33,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2070/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 3.2848595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:33,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.66048 samples/s/p 0:24:51 } +2024-07-30 05:45:36,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2072/ 3125], loss: 0.483, per_step_time: 1413ms, lr: 3.272554e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:36,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65794 samples/s/p 0:24:48 } +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2074/ 3125], loss: 0.392, per_step_time: 1415ms, lr: 3.2602668e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:39,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65077 samples/s/p 0:24:47 } +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2076/ 3125], loss: 0.204, per_step_time: 1414ms, lr: 3.248009e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:41,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65718 samples/s/p 0:24:43 } +2024-07-30 05:45:44,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2078/ 3125], loss: 0.225, per_step_time: 1413ms, lr: 3.2357693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:44,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.65782 samples/s/p 0:24:40 } +2024-07-30 05:45:47,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2080/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 3.2235562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:47,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.65937 samples/s/p 0:24:37 } +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2082/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 3.211364e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:50,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66053 samples/s/p 0:24:34 } +2024-07-30 05:45:53,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2084/ 3125], loss: 0.415, per_step_time: 1413ms, lr: 3.19919e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:53,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66152 samples/s/p 0:24:30 } +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2086/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 3.1870425e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:56,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66159 samples/s/p 0:24:28 } +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2088/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 3.17491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:45:58,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.66061 samples/s/p 0:24:25 } +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2090/ 3125], loss: 0.137, per_step_time: 1412ms, lr: 3.1628102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:01,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66241 samples/s/p 0:24:22 } +2024-07-30 05:46:04,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2092/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1507284e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:04,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65885 samples/s/p 0:24:20 } +2024-07-30 05:46:07,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2094/ 3125], loss: 0.174, per_step_time: 1414ms, lr: 3.1386702e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.65729 samples/s/p 0:24:17 } +2024-07-30 05:46:10,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2096/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 3.126633e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:10,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66090 samples/s/p 0:24:14 } +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2098/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 3.1146197e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:13,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.66113 samples/s/p 0:24:11 } +2024-07-30 05:46:15,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2100/ 3125], loss: 0.144, per_step_time: 1414ms, lr: 3.1026272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:15,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65647 samples/s/p 0:24:09 } +2024-07-30 05:46:18,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2102/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 3.0906529e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:18,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65771 samples/s/p 0:24:06 } +2024-07-30 05:46:21,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2104/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 3.078708e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:21,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.65906 samples/s/p 0:24:03 } +2024-07-30 05:46:24,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2106/ 3125], loss: 0.302, per_step_time: 1412ms, lr: 3.066784e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:24,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.66221 samples/s/p 0:23:59 } +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2108/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 3.0548782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:27,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65830 samples/s/p 0:23:57 } +2024-07-30 05:46:30,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2110/ 3125], loss: 0.341, per_step_time: 1413ms, lr: 3.0429987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:30,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66100 samples/s/p 0:23:54 } +2024-07-30 05:46:32,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2112/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 3.0311435e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:32,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65883 samples/s/p 0:23:52 } +2024-07-30 05:46:35,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2114/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 3.019309e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:35,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.65976 samples/s/p 0:23:49 } +2024-07-30 05:46:38,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2116/ 3125], loss: 0.170, per_step_time: 1413ms, lr: 3.0074892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:38,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.66061 samples/s/p 0:23:45 } +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2118/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.9957056e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:41,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65903 samples/s/p 0:23:43 } +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2120/ 3125], loss: 0.374, per_step_time: 1414ms, lr: 2.9839336e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65678 samples/s/p 0:23:41 } +2024-07-30 05:46:47,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2122/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.9721915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:47,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.65919 samples/s/p 0:23:37 } +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2124/ 3125], loss: 0.254, per_step_time: 1412ms, lr: 2.9604672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:49,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66263 samples/s/p 0:23:34 } +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2126/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.94877e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:52,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.66121 samples/s/p 0:23:31 } +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2128/ 3125], loss: 0.204, per_step_time: 1413ms, lr: 2.9370904e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:55,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65933 samples/s/p 0:23:29 } +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2130/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 2.9254346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:46:58,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.66181 samples/s/p 0:23:25 } +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2132/ 3125], loss: 0.417, per_step_time: 1413ms, lr: 2.9138e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:01,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65849 samples/s/p 0:23:23 } +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2134/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 2.9021888e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:04,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.65922 samples/s/p 0:23:20 } +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2136/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.8905987e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:06,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65820 samples/s/p 0:23:18 } +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2138/ 3125], loss: 0.503, per_step_time: 1413ms, lr: 2.8790353e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:09,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65978 samples/s/p 0:23:15 } +2024-07-30 05:47:12,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2140/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 2.8674899e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65802 samples/s/p 0:23:12 } +2024-07-30 05:47:15,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2142/ 3125], loss: 0.380, per_step_time: 1413ms, lr: 2.8559742e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:15,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65791 samples/s/p 0:23:09 } +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2144/ 3125], loss: 0.340, per_step_time: 1413ms, lr: 2.8444765e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:18,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.65781 samples/s/p 0:23:07 } +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2146/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 2.8329998e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:21,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65988 samples/s/p 0:23:03 } +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2148/ 3125], loss: 0.317, per_step_time: 1414ms, lr: 2.8215436e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:23,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.65729 samples/s/p 0:23:01 } +2024-07-30 05:47:26,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2150/ 3125], loss: 0.360, per_step_time: 1413ms, lr: 2.8101147e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66038 samples/s/p 0:22:57 } +2024-07-30 05:47:26,827 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 05:48:03,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2152/ 3125], loss: 0.418, per_step_time: 2166ms, lr: 2.7987033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:03,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 3.69220 samples/s/p 0:35:08 } +2024-07-30 05:48:06,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2154/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.7873187e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:06,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.66115 samples/s/p 0:22:52 } +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2156/ 3125], loss: 0.291, per_step_time: 1413ms, lr: 2.7759552e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:08,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65908 samples/s/p 0:22:49 } +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2158/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 2.7646155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:11,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65946 samples/s/p 0:22:46 } +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2160/ 3125], loss: 0.600, per_step_time: 1413ms, lr: 2.7532965e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:14,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65945 samples/s/p 0:22:44 } +2024-07-30 05:48:17,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2162/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 2.7420015e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:17,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65830 samples/s/p 0:22:41 } +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2164/ 3125], loss: 0.299, per_step_time: 1414ms, lr: 2.7307271e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:20,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.65589 samples/s/p 0:22:39 } +2024-07-30 05:48:23,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2166/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 2.7194767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:23,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.66083 samples/s/p 0:22:35 } +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2168/ 3125], loss: 0.133, per_step_time: 1414ms, lr: 2.7082532e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:25,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65557 samples/s/p 0:22:33 } +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2170/ 3125], loss: 0.173, per_step_time: 1414ms, lr: 2.6970474e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65704 samples/s/p 0:22:30 } +2024-07-30 05:48:31,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2172/ 3125], loss: 0.375, per_step_time: 1414ms, lr: 2.6858626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:31,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.65632 samples/s/p 0:22:27 } +2024-07-30 05:48:34,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2174/ 3125], loss: 0.299, per_step_time: 1413ms, lr: 2.6747017e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:34,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66083 samples/s/p 0:22:23 } +2024-07-30 05:48:37,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2176/ 3125], loss: 0.295, per_step_time: 1413ms, lr: 2.6635615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:37,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.66021 samples/s/p 0:22:21 } +2024-07-30 05:48:40,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2178/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 2.6524512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:40,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65912 samples/s/p 0:22:18 } +2024-07-30 05:48:42,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2180/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 2.641356e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:42,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65953 samples/s/p 0:22:15 } +2024-07-30 05:48:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2182/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.6302874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.65952 samples/s/p 0:22:12 } +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2184/ 3125], loss: 0.419, per_step_time: 1413ms, lr: 2.6192455e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:48,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.65839 samples/s/p 0:22:10 } +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2186/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 2.6082188e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:51,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.66019 samples/s/p 0:22:07 } +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2188/ 3125], loss: 0.160, per_step_time: 1414ms, lr: 2.5972128e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:54,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65417 samples/s/p 0:22:05 } +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2190/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 2.5862366e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:57,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.65972 samples/s/p 0:22:01 } +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2192/ 3125], loss: 0.316, per_step_time: 1413ms, lr: 2.5752811e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:48:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.66130 samples/s/p 0:21:58 } +2024-07-30 05:49:02,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2194/ 3125], loss: 0.146, per_step_time: 1413ms, lr: 2.5643467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:02,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66064 samples/s/p 0:21:55 } +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2196/ 3125], loss: 0.307, per_step_time: 1412ms, lr: 2.553433e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:05,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.66220 samples/s/p 0:21:52 } +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2198/ 3125], loss: 0.243, per_step_time: 1414ms, lr: 2.5425493e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:08,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65618 samples/s/p 0:21:51 } +2024-07-30 05:49:11,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2200/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.5316834e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.65598 samples/s/p 0:21:48 } +2024-07-30 05:49:14,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2202/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 2.5208382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:14,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66111 samples/s/p 0:21:44 } +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2204/ 3125], loss: 0.325, per_step_time: 1414ms, lr: 2.5100172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:16,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65650 samples/s/p 0:21:42 } +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2206/ 3125], loss: 0.207, per_step_time: 1413ms, lr: 2.4992198e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66147 samples/s/p 0:21:38 } +2024-07-30 05:49:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2208/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 2.4884463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:22,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.66168 samples/s/p 0:21:35 } +2024-07-30 05:49:25,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2210/ 3125], loss: 0.173, per_step_time: 1413ms, lr: 2.4776935e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:25,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.65993 samples/s/p 0:21:33 } +2024-07-30 05:49:28,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2212/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 2.4669646e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:28,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65946 samples/s/p 0:21:30 } +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2214/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 2.4562596e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:31,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65856 samples/s/p 0:21:27 } +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2216/ 3125], loss: 0.425, per_step_time: 1414ms, lr: 2.4455724e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:33,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65692 samples/s/p 0:21:25 } +2024-07-30 05:49:36,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2218/ 3125], loss: 0.370, per_step_time: 1415ms, lr: 2.4349092e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:36,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.65315 samples/s/p 0:21:23 } +2024-07-30 05:49:39,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2220/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 2.424267e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:39,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.66135 samples/s/p 0:21:18 } +2024-07-30 05:49:42,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2222/ 3125], loss: 0.233, per_step_time: 1414ms, lr: 2.4136511e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:42,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.65555 samples/s/p 0:21:17 } +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2224/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 2.4030626e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66002 samples/s/p 0:21:13 } +2024-07-30 05:49:48,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2226/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.3924918e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:48,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66064 samples/s/p 0:21:10 } +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2228/ 3125], loss: 0.080, per_step_time: 1413ms, lr: 2.3819446e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:50,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.66011 samples/s/p 0:21:07 } +2024-07-30 05:49:53,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2230/ 3125], loss: 0.273, per_step_time: 1412ms, lr: 2.3714185e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:53,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66304 samples/s/p 0:21:04 } +2024-07-30 05:49:56,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2232/ 3125], loss: 0.119, per_step_time: 1413ms, lr: 2.3609131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:56,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66072 samples/s/p 0:21:02 } +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2234/ 3125], loss: 0.201, per_step_time: 1412ms, lr: 2.3504346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:49:59,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66276 samples/s/p 0:20:58 } +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2236/ 3125], loss: 0.298, per_step_time: 1412ms, lr: 2.339977e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:02,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.66335 samples/s/p 0:20:55 } +2024-07-30 05:50:05,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2238/ 3125], loss: 0.213, per_step_time: 1414ms, lr: 2.3295432e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.65695 samples/s/p 0:20:54 } +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2240/ 3125], loss: 0.159, per_step_time: 1413ms, lr: 2.3191302e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:07,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66059 samples/s/p 0:20:50 } +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2242/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 2.3087412e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:10,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65870 samples/s/p 0:20:48 } +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2244/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 2.298379e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:13,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66001 samples/s/p 0:20:45 } +2024-07-30 05:50:16,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2246/ 3125], loss: 0.451, per_step_time: 1413ms, lr: 2.2880344e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:16,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.65969 samples/s/p 0:20:42 } +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2248/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 2.277714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:19,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.66035 samples/s/p 0:20:39 } +2024-07-30 05:50:22,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2250/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 2.2674172e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65997 samples/s/p 0:20:36 } +2024-07-30 05:50:24,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2252/ 3125], loss: 0.304, per_step_time: 1414ms, lr: 2.2571385e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:24,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65746 samples/s/p 0:20:34 } +2024-07-30 05:50:27,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2254/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 2.2468895e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:27,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.65786 samples/s/p 0:20:31 } +2024-07-30 05:50:30,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2256/ 3125], loss: 0.151, per_step_time: 1412ms, lr: 2.2366582e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:30,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.66207 samples/s/p 0:20:27 } +2024-07-30 05:50:33,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2258/ 3125], loss: 0.187, per_step_time: 1414ms, lr: 2.226451e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:33,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65640 samples/s/p 0:20:26 } +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2260/ 3125], loss: 0.350, per_step_time: 1414ms, lr: 2.2162705e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:36,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65587 samples/s/p 0:20:23 } +2024-07-30 05:50:39,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2262/ 3125], loss: 0.150, per_step_time: 1413ms, lr: 2.2061108e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:39,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.65907 samples/s/p 0:20:19 } +2024-07-30 05:50:41,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2264/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 2.1959691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:41,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66104 samples/s/p 0:20:16 } +2024-07-30 05:50:44,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2266/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 2.1858513e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:44,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.66160 samples/s/p 0:20:13 } +2024-07-30 05:50:47,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2268/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 2.1757631e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:47,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65775 samples/s/p 0:20:11 } +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2270/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 2.165693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:50,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.66149 samples/s/p 0:20:08 } +2024-07-30 05:50:53,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2272/ 3125], loss: 0.159, per_step_time: 1412ms, lr: 2.1556467e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:53,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.66235 samples/s/p 0:20:05 } +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2274/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 2.145627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:56,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65912 samples/s/p 0:20:03 } +2024-07-30 05:50:58,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2276/ 3125], loss: 0.102, per_step_time: 1413ms, lr: 2.1356195e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:50:58,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.65998 samples/s/p 0:20:00 } +2024-07-30 05:51:01,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2278/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 2.1256416e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:01,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65806 samples/s/p 0:19:57 } +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2280/ 3125], loss: 0.277, per_step_time: 1414ms, lr: 2.1156906e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:04,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65596 samples/s/p 0:19:55 } +2024-07-30 05:51:07,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2282/ 3125], loss: 0.166, per_step_time: 1415ms, lr: 2.1057605e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:07,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65282 samples/s/p 0:19:53 } +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2284/ 3125], loss: 0.233, per_step_time: 1415ms, lr: 2.0958453e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.65206 samples/s/p 0:19:50 } +2024-07-30 05:51:13,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2286/ 3125], loss: 0.250, per_step_time: 1415ms, lr: 2.0859599e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:13,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65370 samples/s/p 0:19:47 } +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2288/ 3125], loss: 0.260, per_step_time: 1413ms, lr: 2.0760953e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:15,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65985 samples/s/p 0:19:43 } +2024-07-30 05:51:18,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2290/ 3125], loss: 0.222, per_step_time: 1413ms, lr: 2.0662516e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:18,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65842 samples/s/p 0:19:40 } +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2292/ 3125], loss: 0.436, per_step_time: 1413ms, lr: 2.0564347e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:21,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.65801 samples/s/p 0:19:37 } +2024-07-30 05:51:24,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2294/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 2.0466386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:24,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.66244 samples/s/p 0:19:34 } +2024-07-30 05:51:27,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2296/ 3125], loss: 0.166, per_step_time: 1416ms, lr: 2.0368695e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:27,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.64955 samples/s/p 0:19:33 } +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2298/ 3125], loss: 0.158, per_step_time: 1412ms, lr: 2.0271182e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:30,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66262 samples/s/p 0:19:28 } +2024-07-30 05:51:32,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2300/ 3125], loss: 0.330, per_step_time: 1413ms, lr: 2.0173967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:32,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66167 samples/s/p 0:19:25 } +2024-07-30 05:51:35,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2302/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.007693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:35,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66078 samples/s/p 0:19:23 } +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2304/ 3125], loss: 0.224, per_step_time: 1413ms, lr: 1.9980102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:38,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.66151 samples/s/p 0:19:20 } +2024-07-30 05:51:41,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2306/ 3125], loss: 0.122, per_step_time: 1412ms, lr: 1.9883512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:41,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66205 samples/s/p 0:19:17 } +2024-07-30 05:51:44,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2308/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 1.9787161e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66171 samples/s/p 0:19:14 } +2024-07-30 05:51:47,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2310/ 3125], loss: 0.457, per_step_time: 1412ms, lr: 1.969102e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:47,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66205 samples/s/p 0:19:11 } +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2312/ 3125], loss: 0.337, per_step_time: 1413ms, lr: 1.9595146e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:49,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66161 samples/s/p 0:19:08 } +2024-07-30 05:51:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2314/ 3125], loss: 0.172, per_step_time: 1413ms, lr: 1.949951e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.66153 samples/s/p 0:19:05 } +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2316/ 3125], loss: 0.174, per_step_time: 1413ms, lr: 1.9404054e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:55,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.66132 samples/s/p 0:19:03 } +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2318/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.9308835e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:51:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65818 samples/s/p 0:19:01 } +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2320/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.9213884e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:01,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65774 samples/s/p 0:18:58 } +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2322/ 3125], loss: 0.131, per_step_time: 1414ms, lr: 1.9119173e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:04,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.65562 samples/s/p 0:18:55 } +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2324/ 3125], loss: 0.200, per_step_time: 1413ms, lr: 1.902464e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:06,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65972 samples/s/p 0:18:52 } +2024-07-30 05:52:09,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2326/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 1.8930375e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:09,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66096 samples/s/p 0:18:49 } +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2328/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 1.8836319e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:12,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65981 samples/s/p 0:18:46 } +2024-07-30 05:52:15,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2330/ 3125], loss: 0.352, per_step_time: 1412ms, lr: 1.8742502e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:15,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.66253 samples/s/p 0:18:43 } +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2332/ 3125], loss: 0.267, per_step_time: 1413ms, lr: 1.8648892e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:18,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.65869 samples/s/p 0:18:41 } +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2334/ 3125], loss: 0.243, per_step_time: 1413ms, lr: 1.8555491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:21,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65928 samples/s/p 0:18:38 } +2024-07-30 05:52:23,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2336/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.8462389e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:23,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65842 samples/s/p 0:18:35 } +2024-07-30 05:52:26,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2338/ 3125], loss: 0.314, per_step_time: 1414ms, lr: 1.8369495e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:26,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65768 samples/s/p 0:18:32 } +2024-07-30 05:52:29,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2340/ 3125], loss: 0.076, per_step_time: 1413ms, lr: 1.827684e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:29,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.66158 samples/s/p 0:18:29 } +2024-07-30 05:52:32,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2342/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 1.8184393e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:32,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.65404 samples/s/p 0:18:27 } +2024-07-30 05:52:35,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2344/ 3125], loss: 0.263, per_step_time: 1413ms, lr: 1.8092155e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65968 samples/s/p 0:18:23 } +2024-07-30 05:52:38,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2346/ 3125], loss: 0.045, per_step_time: 1413ms, lr: 1.8000215e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65929 samples/s/p 0:18:21 } +2024-07-30 05:52:40,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2348/ 3125], loss: 0.177, per_step_time: 1414ms, lr: 1.7908394e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:40,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65579 samples/s/p 0:18:19 } +2024-07-30 05:52:43,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2350/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 1.78169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:43,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.65859 samples/s/p 0:18:15 } +2024-07-30 05:52:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2352/ 3125], loss: 0.405, per_step_time: 1413ms, lr: 1.7725617e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.66152 samples/s/p 0:18:12 } +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2354/ 3125], loss: 0.392, per_step_time: 1413ms, lr: 1.7634571e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:49,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.66040 samples/s/p 0:18:09 } +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2356/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 1.7543672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:52,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65923 samples/s/p 0:18:07 } +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2358/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.7453104e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:55,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65849 samples/s/p 0:18:04 } +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2360/ 3125], loss: 0.342, per_step_time: 1413ms, lr: 1.7362743e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:52:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.65810 samples/s/p 0:18:01 } +2024-07-30 05:53:00,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2362/ 3125], loss: 0.292, per_step_time: 1414ms, lr: 1.7272562e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:00,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65673 samples/s/p 0:17:59 } +2024-07-30 05:53:03,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2364/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 1.7182677e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:03,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65900 samples/s/p 0:17:55 } +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2366/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.7093032e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:06,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65930 samples/s/p 0:17:52 } +2024-07-30 05:53:09,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2368/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.7003566e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:09,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.65998 samples/s/p 0:17:49 } +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2370/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 1.6914368e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:12,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.66229 samples/s/p 0:17:46 } +2024-07-30 05:53:14,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2372/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.6825408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:14,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.66078 samples/s/p 0:17:44 } +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2374/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 1.6736627e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:17,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.66125 samples/s/p 0:17:41 } +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2376/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.6648083e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:20,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.66198 samples/s/p 0:17:38 } +2024-07-30 05:53:23,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2378/ 3125], loss: 0.217, per_step_time: 1413ms, lr: 1.655975e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:23,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.66026 samples/s/p 0:17:35 } +2024-07-30 05:53:26,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2380/ 3125], loss: 0.391, per_step_time: 1413ms, lr: 1.6471714e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:26,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66119 samples/s/p 0:17:32 } +2024-07-30 05:53:29,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2382/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.6383856e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:29,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66021 samples/s/p 0:17:30 } +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2384/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.6296268e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:31,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.66111 samples/s/p 0:17:27 } +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2386/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.6208917e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:34,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65981 samples/s/p 0:17:24 } +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2388/ 3125], loss: 0.043, per_step_time: 1413ms, lr: 1.6121744e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.65923 samples/s/p 0:17:21 } +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2390/ 3125], loss: 0.206, per_step_time: 1413ms, lr: 1.603484e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:40,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65986 samples/s/p 0:17:18 } +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2392/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.5948176e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:43,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65527 samples/s/p 0:17:16 } +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2394/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 1.586169e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:46,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65734 samples/s/p 0:17:13 } +2024-07-30 05:53:48,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2396/ 3125], loss: 0.369, per_step_time: 1414ms, lr: 1.5775501e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65720 samples/s/p 0:17:10 } +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2398/ 3125], loss: 0.399, per_step_time: 1413ms, lr: 1.5689491e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:51,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.65824 samples/s/p 0:17:07 } +2024-07-30 05:53:54,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2400/ 3125], loss: 0.256, per_step_time: 1413ms, lr: 1.560378e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:54,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.66073 samples/s/p 0:17:04 } +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2402/ 3125], loss: 0.127, per_step_time: 1413ms, lr: 1.5518218e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:53:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65848 samples/s/p 0:17:02 } +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2404/ 3125], loss: 0.141, per_step_time: 1413ms, lr: 1.5432924e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:00,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65914 samples/s/p 0:16:59 } +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2406/ 3125], loss: 0.215, per_step_time: 1414ms, lr: 1.5347868e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:03,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.65757 samples/s/p 0:16:56 } +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2408/ 3125], loss: 0.337, per_step_time: 1415ms, lr: 1.5263021e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65367 samples/s/p 0:16:54 } +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2410/ 3125], loss: 0.340, per_step_time: 1414ms, lr: 1.5178442e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65746 samples/s/p 0:16:51 } +2024-07-30 05:54:11,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2412/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 1.509407e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:11,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65820 samples/s/p 0:16:48 } +2024-07-30 05:54:14,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2414/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.5009999e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:14,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.65783 samples/s/p 0:16:45 } +2024-07-30 05:54:17,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2416/ 3125], loss: 0.377, per_step_time: 1413ms, lr: 1.4926076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.66095 samples/s/p 0:16:41 } +2024-07-30 05:54:20,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2418/ 3125], loss: 0.317, per_step_time: 1413ms, lr: 1.4842361e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:20,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.65828 samples/s/p 0:16:39 } +2024-07-30 05:54:22,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2420/ 3125], loss: 0.278, per_step_time: 1413ms, lr: 1.4758915e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66044 samples/s/p 0:16:36 } +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2422/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.4675706e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:25,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66075 samples/s/p 0:16:33 } +2024-07-30 05:54:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2424/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.4592736e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:28,660 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66074 samples/s/p 0:16:30 } +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2426/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.4509976e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:31,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.66022 samples/s/p 0:16:27 } +2024-07-30 05:54:34,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2428/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 1.4427512e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:34,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66028 samples/s/p 0:16:25 } +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2430/ 3125], loss: 0.204, per_step_time: 1412ms, lr: 1.4345228e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:37,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66229 samples/s/p 0:16:21 } +2024-07-30 05:54:39,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2432/ 3125], loss: 0.290, per_step_time: 1413ms, lr: 1.4263212e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.65858 samples/s/p 0:16:19 } +2024-07-30 05:54:42,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2434/ 3125], loss: 0.252, per_step_time: 1412ms, lr: 1.4181346e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:42,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.66255 samples/s/p 0:16:16 } +2024-07-30 05:54:45,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2436/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.4099747e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65952 samples/s/p 0:16:13 } +2024-07-30 05:54:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2438/ 3125], loss: 0.135, per_step_time: 1413ms, lr: 1.4018386e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:48,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65996 samples/s/p 0:16:11 } +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2440/ 3125], loss: 0.349, per_step_time: 1413ms, lr: 1.3937324e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:51,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65888 samples/s/p 0:16:08 } +2024-07-30 05:54:54,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2442/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 1.385638e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:54,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.65862 samples/s/p 0:16:05 } +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2444/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.3775735e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:56,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.66101 samples/s/p 0:16:02 } +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2446/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.3695359e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:54:59,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65915 samples/s/p 0:15:59 } +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2448/ 3125], loss: 0.274, per_step_time: 1414ms, lr: 1.3615131e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65743 samples/s/p 0:15:57 } +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2450/ 3125], loss: 0.194, per_step_time: 1413ms, lr: 1.3535141e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:05,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.66051 samples/s/p 0:15:53 } +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2452/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.345545e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:08,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65966 samples/s/p 0:15:51 } +2024-07-30 05:55:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2454/ 3125], loss: 0.239, per_step_time: 1413ms, lr: 1.3375967e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:11,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.65853 samples/s/p 0:15:48 } +2024-07-30 05:55:14,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2456/ 3125], loss: 0.244, per_step_time: 1414ms, lr: 1.3296693e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:14,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65724 samples/s/p 0:15:46 } +2024-07-30 05:55:16,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2458/ 3125], loss: 0.178, per_step_time: 1415ms, lr: 1.3217628e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:16,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.65219 samples/s/p 0:15:44 } +2024-07-30 05:55:19,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2460/ 3125], loss: 0.284, per_step_time: 1413ms, lr: 1.313889e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:19,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66125 samples/s/p 0:15:39 } +2024-07-30 05:55:22,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2462/ 3125], loss: 0.099, per_step_time: 1413ms, lr: 1.3060301e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66108 samples/s/p 0:15:36 } +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2464/ 3125], loss: 0.348, per_step_time: 1413ms, lr: 1.2981981e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:25,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.66066 samples/s/p 0:15:34 } +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2466/ 3125], loss: 0.240, per_step_time: 1414ms, lr: 1.290381e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65750 samples/s/p 0:15:31 } +2024-07-30 05:55:31,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2468/ 3125], loss: 0.319, per_step_time: 1413ms, lr: 1.2825936e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:31,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66095 samples/s/p 0:15:28 } +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2470/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.274833e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:33,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.66021 samples/s/p 0:15:25 } +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2472/ 3125], loss: 0.237, per_step_time: 1414ms, lr: 1.2670934e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.65517 samples/s/p 0:15:23 } +2024-07-30 05:55:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2474/ 3125], loss: 0.373, per_step_time: 1413ms, lr: 1.2593746e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:39,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65946 samples/s/p 0:15:20 } +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2476/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 1.2516796e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:42,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65722 samples/s/p 0:15:17 } +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2478/ 3125], loss: 0.326, per_step_time: 1413ms, lr: 1.2440115e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:45,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66037 samples/s/p 0:15:14 } +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2480/ 3125], loss: 0.105, per_step_time: 1413ms, lr: 1.2363672e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:48,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.65843 samples/s/p 0:15:11 } +2024-07-30 05:55:50,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2482/ 3125], loss: 0.277, per_step_time: 1413ms, lr: 1.2287408e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:50,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.66161 samples/s/p 0:15:08 } +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2484/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.2211382e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:53,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65813 samples/s/p 0:15:06 } +2024-07-30 05:55:56,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2486/ 3125], loss: 0.445, per_step_time: 1413ms, lr: 1.2135625e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:56,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.65837 samples/s/p 0:15:03 } +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2488/ 3125], loss: 0.332, per_step_time: 1412ms, lr: 1.2060076e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:55:59,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66182 samples/s/p 0:15:00 } +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2490/ 3125], loss: 0.244, per_step_time: 1413ms, lr: 1.1984795e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:02,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66124 samples/s/p 0:14:57 } +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2492/ 3125], loss: 0.110, per_step_time: 1413ms, lr: 1.1909723e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.66095 samples/s/p 0:14:54 } +2024-07-30 05:56:07,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2494/ 3125], loss: 0.096, per_step_time: 1413ms, lr: 1.18348595e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:07,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65991 samples/s/p 0:14:51 } +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2496/ 3125], loss: 0.230, per_step_time: 1413ms, lr: 1.1760235e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:10,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65854 samples/s/p 0:14:49 } +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2498/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 1.1685848e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:13,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65928 samples/s/p 0:14:46 } +2024-07-30 05:56:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2500/ 3125], loss: 0.334, per_step_time: 1414ms, lr: 1.1611759e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:16,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.65660 samples/s/p 0:14:43 } +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2502/ 3125], loss: 0.413, per_step_time: 1415ms, lr: 1.153782e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.65231 samples/s/p 0:14:41 } +2024-07-30 05:56:22,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2504/ 3125], loss: 0.376, per_step_time: 1413ms, lr: 1.14641786e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:22,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66148 samples/s/p 0:14:37 } +2024-07-30 05:56:24,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2506/ 3125], loss: 0.242, per_step_time: 1412ms, lr: 1.13907156e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:24,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66222 samples/s/p 0:14:34 } +2024-07-30 05:56:27,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2508/ 3125], loss: 0.164, per_step_time: 1413ms, lr: 1.1317521e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:27,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66110 samples/s/p 0:14:31 } +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2510/ 3125], loss: 0.126, per_step_time: 1413ms, lr: 1.1244505e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.66049 samples/s/p 0:14:29 } +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2512/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.11717874e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:33,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65483 samples/s/p 0:14:27 } +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2514/ 3125], loss: 0.190, per_step_time: 1413ms, lr: 1.1099249e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:36,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65961 samples/s/p 0:14:23 } +2024-07-30 05:56:39,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2516/ 3125], loss: 0.254, per_step_time: 1414ms, lr: 1.1027008e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65707 samples/s/p 0:14:21 } +2024-07-30 05:56:41,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2518/ 3125], loss: 0.192, per_step_time: 1415ms, lr: 1.0954946e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:41,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.65336 samples/s/p 0:14:18 } +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2520/ 3125], loss: 0.403, per_step_time: 1413ms, lr: 1.0883152e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.66169 samples/s/p 0:14:14 } +2024-07-30 05:56:47,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2522/ 3125], loss: 0.298, per_step_time: 1413ms, lr: 1.0811567e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:47,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65947 samples/s/p 0:14:12 } +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2524/ 3125], loss: 0.348, per_step_time: 1412ms, lr: 1.074025e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:50,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66173 samples/s/p 0:14:09 } +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2526/ 3125], loss: 0.267, per_step_time: 1412ms, lr: 1.0669142e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:53,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.66193 samples/s/p 0:14:06 } +2024-07-30 05:56:56,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2528/ 3125], loss: 0.247, per_step_time: 1413ms, lr: 1.0598272e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.65799 samples/s/p 0:14:04 } +2024-07-30 05:56:58,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2530/ 3125], loss: 0.130, per_step_time: 1412ms, lr: 1.0527551e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:56:58,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66221 samples/s/p 0:14:00 } +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2532/ 3125], loss: 0.062, per_step_time: 1413ms, lr: 1.04571576e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:01,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66142 samples/s/p 0:13:57 } +2024-07-30 05:57:04,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2534/ 3125], loss: 0.364, per_step_time: 1414ms, lr: 1.0387033e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:04,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65444 samples/s/p 0:13:56 } +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2536/ 3125], loss: 0.319, per_step_time: 1412ms, lr: 1.0317057e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:07,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.66173 samples/s/p 0:13:52 } +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2538/ 3125], loss: 0.071, per_step_time: 1415ms, lr: 1.0247349e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.65199 samples/s/p 0:13:50 } +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2540/ 3125], loss: 0.294, per_step_time: 1414ms, lr: 1.017788e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:13,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65755 samples/s/p 0:13:47 } +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2542/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 1.0108679e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:15,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65526 samples/s/p 0:13:44 } +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2544/ 3125], loss: 0.389, per_step_time: 1414ms, lr: 1.0039687e-07, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65723 samples/s/p 0:13:41 } +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2546/ 3125], loss: 0.241, per_step_time: 1412ms, lr: 9.9709034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.66312 samples/s/p 0:13:37 } +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2548/ 3125], loss: 0.436, per_step_time: 1414ms, lr: 9.902358e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.65706 samples/s/p 0:13:35 } +2024-07-30 05:57:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2550/ 3125], loss: 0.187, per_step_time: 1412ms, lr: 9.834021e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:27,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66245 samples/s/p 0:13:32 } +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2552/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 9.765982e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:30,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.65803 samples/s/p 0:13:30 } +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2554/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 9.6981225e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:32,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66132 samples/s/p 0:13:26 } +2024-07-30 05:57:35,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2556/ 3125], loss: 0.270, per_step_time: 1413ms, lr: 9.630531e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.66095 samples/s/p 0:13:24 } +2024-07-30 05:57:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2558/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 9.5631776e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.65994 samples/s/p 0:13:21 } +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2560/ 3125], loss: 0.161, per_step_time: 1413ms, lr: 9.4960626e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.66039 samples/s/p 0:13:18 } +2024-07-30 05:57:44,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2562/ 3125], loss: 0.318, per_step_time: 1425ms, lr: 9.429186e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:44,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.61137 samples/s/p 0:13:22 } +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2564/ 3125], loss: 0.187, per_step_time: 1413ms, lr: 9.362459e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:47,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.65883 samples/s/p 0:13:13 } +2024-07-30 05:57:49,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2566/ 3125], loss: 0.332, per_step_time: 1413ms, lr: 9.29603e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:49,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.66055 samples/s/p 0:13:10 } +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2568/ 3125], loss: 0.229, per_step_time: 1414ms, lr: 9.2298386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65578 samples/s/p 0:13:07 } +2024-07-30 05:57:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2570/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 9.163886e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:55,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.66105 samples/s/p 0:13:04 } +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2572/ 3125], loss: 0.212, per_step_time: 1414ms, lr: 9.098202e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:57:58,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65548 samples/s/p 0:13:02 } +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2574/ 3125], loss: 0.321, per_step_time: 1413ms, lr: 9.032637e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65819 samples/s/p 0:12:59 } +2024-07-30 05:58:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2576/ 3125], loss: 0.447, per_step_time: 1413ms, lr: 8.9674295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:04,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.65920 samples/s/p 0:12:56 } +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2578/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.9024006e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:06,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66080 samples/s/p 0:12:53 } +2024-07-30 05:58:09,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2580/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 8.83764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:09,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.66075 samples/s/p 0:12:50 } +2024-07-30 05:58:12,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2582/ 3125], loss: 0.219, per_step_time: 1413ms, lr: 8.7730584e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:12,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65836 samples/s/p 0:12:47 } +2024-07-30 05:58:15,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2584/ 3125], loss: 0.226, per_step_time: 1414ms, lr: 8.708715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:15,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.65666 samples/s/p 0:12:45 } +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2586/ 3125], loss: 0.261, per_step_time: 1413ms, lr: 8.64467e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:18,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66098 samples/s/p 0:12:41 } +2024-07-30 05:58:21,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2588/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 8.580774e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65972 samples/s/p 0:12:39 } +2024-07-30 05:58:23,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2590/ 3125], loss: 0.333, per_step_time: 1413ms, lr: 8.5171756e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:23,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65934 samples/s/p 0:12:36 } +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2592/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 8.453816e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:26,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.66048 samples/s/p 0:12:33 } +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2594/ 3125], loss: 0.322, per_step_time: 1413ms, lr: 8.390635e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:29,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.65815 samples/s/p 0:12:30 } +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2596/ 3125], loss: 0.275, per_step_time: 1414ms, lr: 8.327722e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:32,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65552 samples/s/p 0:12:28 } +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2598/ 3125], loss: 0.081, per_step_time: 1414ms, lr: 8.265048e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:35,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.65724 samples/s/p 0:12:25 } +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2600/ 3125], loss: 0.168, per_step_time: 1413ms, lr: 8.202642e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:38,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66141 samples/s/p 0:12:21 } +2024-07-30 05:58:40,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2602/ 3125], loss: 0.213, per_step_time: 1413ms, lr: 8.1404444e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:40,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66000 samples/s/p 0:12:19 } +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2604/ 3125], loss: 0.317, per_step_time: 1412ms, lr: 8.078426e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:43,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.66258 samples/s/p 0:12:16 } +2024-07-30 05:58:46,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2606/ 3125], loss: 0.304, per_step_time: 1412ms, lr: 8.0167055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:46,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66238 samples/s/p 0:12:13 } +2024-07-30 05:58:49,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2608/ 3125], loss: 0.178, per_step_time: 1414ms, lr: 7.955163e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:49,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.65708 samples/s/p 0:12:11 } +2024-07-30 05:58:52,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2610/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 7.893949e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:52,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66157 samples/s/p 0:12:07 } +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2612/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 7.8329144e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:55,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66008 samples/s/p 0:12:05 } +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2614/ 3125], loss: 0.163, per_step_time: 1413ms, lr: 7.7721474e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:58:57,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.66134 samples/s/p 0:12:02 } +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2616/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 7.7115295e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:00,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66125 samples/s/p 0:11:59 } +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2618/ 3125], loss: 0.287, per_step_time: 1413ms, lr: 7.6512094e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66025 samples/s/p 0:11:56 } +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2620/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.591128e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.65868 samples/s/p 0:11:53 } +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2622/ 3125], loss: 0.276, per_step_time: 1413ms, lr: 7.5312556e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:09,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.66029 samples/s/p 0:11:50 } +2024-07-30 05:59:12,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2624/ 3125], loss: 0.343, per_step_time: 1425ms, lr: 7.47165e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:12,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.61262 samples/s/p 0:11:54 } +2024-07-30 05:59:14,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2626/ 3125], loss: 0.095, per_step_time: 1413ms, lr: 7.4122546e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:14,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65789 samples/s/p 0:11:45 } +2024-07-30 05:59:17,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2628/ 3125], loss: 0.128, per_step_time: 1415ms, lr: 7.353127e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:17,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.65232 samples/s/p 0:11:43 } +2024-07-30 05:59:20,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2630/ 3125], loss: 0.312, per_step_time: 1412ms, lr: 7.294178e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:20,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66176 samples/s/p 0:11:39 } +2024-07-30 05:59:23,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2632/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 7.235497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:23,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.66110 samples/s/p 0:11:36 } +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2634/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 7.177055e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65906 samples/s/p 0:11:34 } +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2636/ 3125], loss: 0.153, per_step_time: 1413ms, lr: 7.118821e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:29,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65950 samples/s/p 0:11:31 } +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2638/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 7.0609154e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65749 samples/s/p 0:11:28 } +2024-07-30 05:59:34,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2640/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 7.003158e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:34,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65853 samples/s/p 0:11:25 } +2024-07-30 05:59:37,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2642/ 3125], loss: 0.435, per_step_time: 1415ms, lr: 6.94561e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:37,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.65324 samples/s/p 0:11:23 } +2024-07-30 05:59:40,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2644/ 3125], loss: 0.196, per_step_time: 1413ms, lr: 6.8883594e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:40,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.65810 samples/s/p 0:11:20 } +2024-07-30 05:59:43,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2646/ 3125], loss: 0.293, per_step_time: 1412ms, lr: 6.831318e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66219 samples/s/p 0:11:16 } +2024-07-30 05:59:46,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2648/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 6.774515e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:46,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66005 samples/s/p 0:11:14 } +2024-07-30 05:59:48,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2650/ 3125], loss: 0.221, per_step_time: 1412ms, lr: 6.71792e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:48,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.66240 samples/s/p 0:11:11 } +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2652/ 3125], loss: 0.039, per_step_time: 1413ms, lr: 6.661624e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:51,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66019 samples/s/p 0:11:08 } +2024-07-30 05:59:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2654/ 3125], loss: 0.388, per_step_time: 1416ms, lr: 6.605536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:54,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.64734 samples/s/p 0:11:07 } +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2656/ 3125], loss: 0.434, per_step_time: 1413ms, lr: 6.549686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 05:59:57,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66050 samples/s/p 0:11:02 } +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2658/ 3125], loss: 0.437, per_step_time: 1414ms, lr: 6.494045e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:00,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.65408 samples/s/p 0:11:00 } +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2660/ 3125], loss: 0.326, per_step_time: 1412ms, lr: 6.4386725e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.66180 samples/s/p 0:10:57 } +2024-07-30 06:00:05,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2662/ 3125], loss: 0.280, per_step_time: 1413ms, lr: 6.383538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:05,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65997 samples/s/p 0:10:54 } +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2664/ 3125], loss: 0.132, per_step_time: 1413ms, lr: 6.328612e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:08,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.65901 samples/s/p 0:10:51 } +2024-07-30 06:00:11,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2666/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 6.273955e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:11,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66181 samples/s/p 0:10:48 } +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2668/ 3125], loss: 0.143, per_step_time: 1413ms, lr: 6.2194765e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66011 samples/s/p 0:10:45 } +2024-07-30 06:00:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2670/ 3125], loss: 0.177, per_step_time: 1412ms, lr: 6.1652656e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:17,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.66175 samples/s/p 0:10:42 } +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2672/ 3125], loss: 0.228, per_step_time: 1413ms, lr: 6.111294e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:20,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65827 samples/s/p 0:10:40 } +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2674/ 3125], loss: 0.306, per_step_time: 1412ms, lr: 6.05759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:22,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66223 samples/s/p 0:10:37 } +2024-07-30 06:00:25,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2676/ 3125], loss: 0.108, per_step_time: 1413ms, lr: 6.0041245e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:25,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.66027 samples/s/p 0:10:34 } +2024-07-30 06:00:28,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2678/ 3125], loss: 0.241, per_step_time: 1413ms, lr: 5.950838e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:28,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.65853 samples/s/p 0:10:31 } +2024-07-30 06:00:31,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2680/ 3125], loss: 0.439, per_step_time: 1413ms, lr: 5.89779e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:31,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66072 samples/s/p 0:10:28 } +2024-07-30 06:00:34,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2682/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 5.8449803e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:34,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65908 samples/s/p 0:10:26 } +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2684/ 3125], loss: 0.422, per_step_time: 1414ms, lr: 5.792439e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:37,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65656 samples/s/p 0:10:23 } +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2686/ 3125], loss: 0.234, per_step_time: 1412ms, lr: 5.7401657e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:39,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.66179 samples/s/p 0:10:20 } +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2688/ 3125], loss: 0.657, per_step_time: 1413ms, lr: 5.6880115e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:42,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.65943 samples/s/p 0:10:17 } +2024-07-30 06:00:45,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2690/ 3125], loss: 0.300, per_step_time: 1413ms, lr: 5.6361852e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:45,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65921 samples/s/p 0:10:14 } +2024-07-30 06:00:48,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2692/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 5.5845973e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:48,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65823 samples/s/p 0:10:12 } +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2694/ 3125], loss: 0.072, per_step_time: 1414ms, lr: 5.5332183e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:51,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65410 samples/s/p 0:10:09 } +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2696/ 3125], loss: 0.481, per_step_time: 1414ms, lr: 5.4820475e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.65390 samples/s/p 0:10:07 } +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2698/ 3125], loss: 0.191, per_step_time: 1413ms, lr: 5.4311453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.66100 samples/s/p 0:10:03 } +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2700/ 3125], loss: 0.306, per_step_time: 1413ms, lr: 5.3805113e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:00:59,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66114 samples/s/p 0:10:00 } +2024-07-30 06:01:02,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2702/ 3125], loss: 0.315, per_step_time: 1413ms, lr: 5.3300855e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:02,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65935 samples/s/p 0:09:57 } +2024-07-30 06:01:05,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2704/ 3125], loss: 0.296, per_step_time: 1413ms, lr: 5.2798686e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:05,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.65925 samples/s/p 0:09:55 } +2024-07-30 06:01:08,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2706/ 3125], loss: 0.211, per_step_time: 1413ms, lr: 5.22992e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:08,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.66156 samples/s/p 0:09:52 } +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2708/ 3125], loss: 0.297, per_step_time: 1414ms, lr: 5.1802097e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:11,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65648 samples/s/p 0:09:49 } +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2710/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 5.1307378e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:14,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65955 samples/s/p 0:09:46 } +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2712/ 3125], loss: 0.024, per_step_time: 1413ms, lr: 5.081445e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:16,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65784 samples/s/p 0:09:43 } +2024-07-30 06:01:19,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2714/ 3125], loss: 0.197, per_step_time: 1414ms, lr: 5.03242e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:19,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65443 samples/s/p 0:09:41 } +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2716/ 3125], loss: 0.221, per_step_time: 1413ms, lr: 4.9836633e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:22,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.65860 samples/s/p 0:09:38 } +2024-07-30 06:01:25,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2718/ 3125], loss: 0.164, per_step_time: 1414ms, lr: 4.9351453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:25,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65620 samples/s/p 0:09:35 } +2024-07-30 06:01:28,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2720/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.886836e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:28,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.66001 samples/s/p 0:09:32 } +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2722/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 4.8387644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:31,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65878 samples/s/p 0:09:29 } +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2724/ 3125], loss: 0.248, per_step_time: 1413ms, lr: 4.790902e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.65939 samples/s/p 0:09:26 } +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2726/ 3125], loss: 0.329, per_step_time: 1413ms, lr: 4.7433375e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:36,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.66151 samples/s/p 0:09:23 } +2024-07-30 06:01:39,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2728/ 3125], loss: 0.289, per_step_time: 1413ms, lr: 4.6959517e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:39,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65838 samples/s/p 0:09:21 } +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2730/ 3125], loss: 0.318, per_step_time: 1413ms, lr: 4.6488342e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:42,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66045 samples/s/p 0:09:18 } +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2732/ 3125], loss: 0.372, per_step_time: 1413ms, lr: 4.601985e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:45,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.65922 samples/s/p 0:09:15 } +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2734/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 4.5553147e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:48,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.66041 samples/s/p 0:09:12 } +2024-07-30 06:01:50,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2736/ 3125], loss: 0.227, per_step_time: 1413ms, lr: 4.5088825e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:50,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.65985 samples/s/p 0:09:09 } +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2738/ 3125], loss: 0.397, per_step_time: 1413ms, lr: 4.462689e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:53,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66064 samples/s/p 0:09:06 } +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2740/ 3125], loss: 0.361, per_step_time: 1413ms, lr: 4.416764e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:56,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66117 samples/s/p 0:09:04 } +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2742/ 3125], loss: 0.231, per_step_time: 1413ms, lr: 4.3710767e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:01:59,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.66003 samples/s/p 0:09:01 } +2024-07-30 06:02:02,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2744/ 3125], loss: 0.386, per_step_time: 1413ms, lr: 4.3255984e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:02,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.65846 samples/s/p 0:08:58 } +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2746/ 3125], loss: 0.068, per_step_time: 1412ms, lr: 4.2803883e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:05,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.66290 samples/s/p 0:08:55 } +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2748/ 3125], loss: 0.357, per_step_time: 1414ms, lr: 4.2353868e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:07,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.65710 samples/s/p 0:08:53 } +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2750/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 4.1906535e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65958 samples/s/p 0:08:50 } +2024-07-30 06:02:13,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2752/ 3125], loss: 0.364, per_step_time: 1415ms, lr: 4.1461288e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:13,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.65276 samples/s/p 0:08:47 } +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2754/ 3125], loss: 0.232, per_step_time: 1413ms, lr: 4.1018424e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:16,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.66043 samples/s/p 0:08:44 } +2024-07-30 06:02:19,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2756/ 3125], loss: 0.309, per_step_time: 1414ms, lr: 4.0577948e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:19,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65390 samples/s/p 0:08:42 } +2024-07-30 06:02:22,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2758/ 3125], loss: 0.245, per_step_time: 1413ms, lr: 4.014015e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:22,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66156 samples/s/p 0:08:38 } +2024-07-30 06:02:24,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2760/ 3125], loss: 0.477, per_step_time: 1414ms, lr: 3.9704442e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.65694 samples/s/p 0:08:36 } +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2762/ 3125], loss: 0.205, per_step_time: 1413ms, lr: 3.9270518e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:27,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66016 samples/s/p 0:08:33 } +2024-07-30 06:02:30,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2764/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 3.8839875e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:30,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.66122 samples/s/p 0:08:30 } +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2766/ 3125], loss: 0.214, per_step_time: 1412ms, lr: 3.841102e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:33,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66210 samples/s/p 0:08:27 } +2024-07-30 06:02:36,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2768/ 3125], loss: 0.448, per_step_time: 1413ms, lr: 3.7985146e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:36,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66018 samples/s/p 0:08:24 } +2024-07-30 06:02:39,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2770/ 3125], loss: 0.237, per_step_time: 1412ms, lr: 3.7561357e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:39,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66286 samples/s/p 0:08:21 } +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2772/ 3125], loss: 0.273, per_step_time: 1413ms, lr: 3.7139653e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:41,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.66095 samples/s/p 0:08:18 } +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2774/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 3.6720333e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:44,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66143 samples/s/p 0:08:15 } +2024-07-30 06:02:47,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2776/ 3125], loss: 0.407, per_step_time: 1412ms, lr: 3.63034e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:47,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66267 samples/s/p 0:08:13 } +2024-07-30 06:02:50,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2778/ 3125], loss: 0.339, per_step_time: 1413ms, lr: 3.5889446e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:50,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66039 samples/s/p 0:08:10 } +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2780/ 3125], loss: 0.166, per_step_time: 1412ms, lr: 3.5476685e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.66302 samples/s/p 0:08:07 } +2024-07-30 06:02:56,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2782/ 3125], loss: 0.459, per_step_time: 1414ms, lr: 3.5067497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:56,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.65693 samples/s/p 0:08:05 } +2024-07-30 06:02:58,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2784/ 3125], loss: 0.311, per_step_time: 1416ms, lr: 3.46601e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:02:58,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.64966 samples/s/p 0:08:02 } +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2786/ 3125], loss: 0.355, per_step_time: 1413ms, lr: 3.4255386e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:01,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65996 samples/s/p 0:07:59 } +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2788/ 3125], loss: 0.211, per_step_time: 1414ms, lr: 3.3852753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:04,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65734 samples/s/p 0:07:56 } +2024-07-30 06:03:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2790/ 3125], loss: 0.353, per_step_time: 1414ms, lr: 3.3452807e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:07,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65745 samples/s/p 0:07:53 } +2024-07-30 06:03:10,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2792/ 3125], loss: 0.171, per_step_time: 1414ms, lr: 3.3054945e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:10,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.65692 samples/s/p 0:07:50 } +2024-07-30 06:03:13,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2794/ 3125], loss: 0.343, per_step_time: 1413ms, lr: 3.265947e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:13,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65996 samples/s/p 0:07:47 } +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2796/ 3125], loss: 0.270, per_step_time: 1414ms, lr: 3.226608e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:15,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65475 samples/s/p 0:07:45 } +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2798/ 3125], loss: 0.333, per_step_time: 1414ms, lr: 3.187567e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:18,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65712 samples/s/p 0:07:42 } +2024-07-30 06:03:21,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2800/ 3125], loss: 0.323, per_step_time: 1413ms, lr: 3.1487644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:21,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.65833 samples/s/p 0:07:39 } +2024-07-30 06:03:24,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2802/ 3125], loss: 0.151, per_step_time: 1414ms, lr: 3.1101703e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65707 samples/s/p 0:07:36 } +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2804/ 3125], loss: 0.325, per_step_time: 1413ms, lr: 3.071755e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:27,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66034 samples/s/p 0:07:33 } +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2806/ 3125], loss: 0.184, per_step_time: 1413ms, lr: 3.033668e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:30,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65964 samples/s/p 0:07:30 } +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2808/ 3125], loss: 0.221, per_step_time: 1414ms, lr: 2.995759e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:32,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.65698 samples/s/p 0:07:28 } +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2810/ 3125], loss: 0.115, per_step_time: 1412ms, lr: 2.9581486e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.66200 samples/s/p 0:07:25 } +2024-07-30 06:03:38,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2812/ 3125], loss: 0.130, per_step_time: 1413ms, lr: 2.920717e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:38,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66084 samples/s/p 0:07:22 } +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2814/ 3125], loss: 0.147, per_step_time: 1413ms, lr: 2.8835236e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:41,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66162 samples/s/p 0:07:19 } +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2816/ 3125], loss: 0.315, per_step_time: 1412ms, lr: 2.8466582e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:44,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66205 samples/s/p 0:07:16 } +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2818/ 3125], loss: 0.370, per_step_time: 1413ms, lr: 2.8099416e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:47,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66006 samples/s/p 0:07:13 } +2024-07-30 06:03:49,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2820/ 3125], loss: 0.441, per_step_time: 1412ms, lr: 2.773434e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:49,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.66220 samples/s/p 0:07:10 } +2024-07-30 06:03:52,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2822/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 2.7372538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:52,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65867 samples/s/p 0:07:08 } +2024-07-30 06:03:55,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2824/ 3125], loss: 0.347, per_step_time: 1413ms, lr: 2.7012526e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:55,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.66049 samples/s/p 0:07:05 } +2024-07-30 06:03:58,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2826/ 3125], loss: 0.407, per_step_time: 1413ms, lr: 2.6655197e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:03:58,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65949 samples/s/p 0:07:02 } +2024-07-30 06:04:01,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2828/ 3125], loss: 0.230, per_step_time: 1415ms, lr: 2.6299952e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:01,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.65307 samples/s/p 0:07:00 } +2024-07-30 06:04:04,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2830/ 3125], loss: 0.183, per_step_time: 1413ms, lr: 2.5947392e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:04,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66151 samples/s/p 0:06:56 } +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2832/ 3125], loss: 0.297, per_step_time: 1413ms, lr: 2.5597213e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66081 samples/s/p 0:06:54 } +2024-07-30 06:04:09,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2834/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 2.5248527e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:09,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.66107 samples/s/p 0:06:51 } +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2836/ 3125], loss: 0.271, per_step_time: 1414ms, lr: 2.4903715e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:12,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65770 samples/s/p 0:06:48 } +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2838/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 2.4560093e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.65919 samples/s/p 0:06:45 } +2024-07-30 06:04:18,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2840/ 3125], loss: 0.247, per_step_time: 1414ms, lr: 2.4219453e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:18,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65650 samples/s/p 0:06:43 } +2024-07-30 06:04:21,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2842/ 3125], loss: 0.265, per_step_time: 1413ms, lr: 2.3881196e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65941 samples/s/p 0:06:40 } +2024-07-30 06:04:23,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2844/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 2.3544729e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:23,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66024 samples/s/p 0:06:37 } +2024-07-30 06:04:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2846/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 2.3211241e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.66024 samples/s/p 0:06:34 } +2024-07-30 06:04:29,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2848/ 3125], loss: 0.345, per_step_time: 1414ms, lr: 2.2880137e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:29,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.65752 samples/s/p 0:06:31 } +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2850/ 3125], loss: 0.404, per_step_time: 1413ms, lr: 2.255082e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:32,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.66047 samples/s/p 0:06:28 } +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2852/ 3125], loss: 0.128, per_step_time: 1413ms, lr: 2.2224187e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:35,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65785 samples/s/p 0:06:26 } +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2854/ 3125], loss: 0.231, per_step_time: 1414ms, lr: 2.1899938e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:38,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.65527 samples/s/p 0:06:23 } +2024-07-30 06:04:40,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2856/ 3125], loss: 0.252, per_step_time: 1413ms, lr: 2.1578073e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:40,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.66042 samples/s/p 0:06:20 } +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2858/ 3125], loss: 0.124, per_step_time: 1414ms, lr: 2.125889e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:43,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65568 samples/s/p 0:06:17 } +2024-07-30 06:04:46,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2860/ 3125], loss: 0.263, per_step_time: 1414ms, lr: 2.0941794e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:46,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65726 samples/s/p 0:06:14 } +2024-07-30 06:04:49,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2862/ 3125], loss: 0.336, per_step_time: 1413ms, lr: 2.0627379e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:49,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65952 samples/s/p 0:06:11 } +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2864/ 3125], loss: 0.192, per_step_time: 1419ms, lr: 2.0314753e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:52,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.63497 samples/s/p 0:06:10 } +2024-07-30 06:04:55,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2866/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.0005107e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:55,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.65830 samples/s/p 0:06:06 } +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2868/ 3125], loss: 0.290, per_step_time: 1414ms, lr: 1.9697248e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:04:57,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65719 samples/s/p 0:06:03 } +2024-07-30 06:05:00,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2870/ 3125], loss: 0.354, per_step_time: 1413ms, lr: 1.9392072e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:00,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66052 samples/s/p 0:06:00 } +2024-07-30 06:05:03,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2872/ 3125], loss: 0.149, per_step_time: 1413ms, lr: 1.908958e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:03,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.65935 samples/s/p 0:05:57 } +2024-07-30 06:05:06,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2874/ 3125], loss: 0.262, per_step_time: 1413ms, lr: 1.8788874e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:06,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66058 samples/s/p 0:05:54 } +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2876/ 3125], loss: 0.313, per_step_time: 1413ms, lr: 1.849085e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:09,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.66012 samples/s/p 0:05:51 } +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2878/ 3125], loss: 0.268, per_step_time: 1413ms, lr: 1.819521e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:12,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.65785 samples/s/p 0:05:49 } +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2880/ 3125], loss: 0.092, per_step_time: 1412ms, lr: 1.7902254e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:14,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66171 samples/s/p 0:05:46 } +2024-07-30 06:05:17,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2882/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 1.7611086e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:17,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66032 samples/s/p 0:05:43 } +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2884/ 3125], loss: 0.282, per_step_time: 1413ms, lr: 1.73226e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:20,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.66052 samples/s/p 0:05:40 } +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2886/ 3125], loss: 0.269, per_step_time: 1413ms, lr: 1.7036497e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:23,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65977 samples/s/p 0:05:37 } +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2888/ 3125], loss: 0.341, per_step_time: 1414ms, lr: 1.6752184e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:26,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65636 samples/s/p 0:05:35 } +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2890/ 3125], loss: 0.144, per_step_time: 1413ms, lr: 1.6471148e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:29,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66097 samples/s/p 0:05:32 } +2024-07-30 06:05:31,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2892/ 3125], loss: 0.404, per_step_time: 1414ms, lr: 1.6192198e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:31,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.65705 samples/s/p 0:05:29 } +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2894/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 1.5915631e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:34,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.66148 samples/s/p 0:05:26 } +2024-07-30 06:05:37,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2896/ 3125], loss: 0.167, per_step_time: 1415ms, lr: 1.5641152e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:37,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65278 samples/s/p 0:05:24 } +2024-07-30 06:05:40,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2898/ 3125], loss: 0.374, per_step_time: 1413ms, lr: 1.5369654e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:40,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66138 samples/s/p 0:05:20 } +2024-07-30 06:05:43,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2900/ 3125], loss: 0.129, per_step_time: 1413ms, lr: 1.5099644e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:43,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65895 samples/s/p 0:05:18 } +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2902/ 3125], loss: 0.152, per_step_time: 1413ms, lr: 1.4832615e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.66053 samples/s/p 0:05:15 } +2024-07-30 06:05:48,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2904/ 3125], loss: 0.422, per_step_time: 1413ms, lr: 1.4568269e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:48,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.65910 samples/s/p 0:05:12 } +2024-07-30 06:05:51,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2906/ 3125], loss: 0.186, per_step_time: 1414ms, lr: 1.4305412e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:51,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65746 samples/s/p 0:05:09 } +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2908/ 3125], loss: 0.381, per_step_time: 1414ms, lr: 1.4045536e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:54,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65652 samples/s/p 0:05:06 } +2024-07-30 06:05:57,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2910/ 3125], loss: 0.063, per_step_time: 1413ms, lr: 1.3787746e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:05:57,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.65790 samples/s/p 0:05:03 } +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2912/ 3125], loss: 0.152, per_step_time: 1424ms, lr: 1.35329365e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:00,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.61565 samples/s/p 0:05:03 } +2024-07-30 06:06:03,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2914/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 1.3279915e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:03,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.66086 samples/s/p 0:04:58 } +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2916/ 3125], loss: 0.215, per_step_time: 1413ms, lr: 1.3029575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:05,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.66029 samples/s/p 0:04:55 } +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2918/ 3125], loss: 0.290, per_step_time: 1415ms, lr: 1.2781322e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:08,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65150 samples/s/p 0:04:53 } +2024-07-30 06:06:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2920/ 3125], loss: 0.135, per_step_time: 1420ms, lr: 1.253575e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:11,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.63368 samples/s/p 0:04:51 } +2024-07-30 06:06:14,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2922/ 3125], loss: 0.302, per_step_time: 1413ms, lr: 1.2292862e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:14,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.65869 samples/s/p 0:04:46 } +2024-07-30 06:06:17,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2924/ 3125], loss: 0.181, per_step_time: 1413ms, lr: 1.20517605e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65941 samples/s/p 0:04:44 } +2024-07-30 06:06:20,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2926/ 3125], loss: 0.231, per_step_time: 1415ms, lr: 1.1813044e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:20,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65209 samples/s/p 0:04:41 } +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2928/ 3125], loss: 0.131, per_step_time: 1413ms, lr: 1.1576712e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:23,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.65771 samples/s/p 0:04:38 } +2024-07-30 06:06:25,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2930/ 3125], loss: 0.466, per_step_time: 1413ms, lr: 1.1342763e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:25,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66076 samples/s/p 0:04:35 } +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2932/ 3125], loss: 0.193, per_step_time: 1413ms, lr: 1.1111796e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:28,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.66044 samples/s/p 0:04:32 } +2024-07-30 06:06:31,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2934/ 3125], loss: 0.259, per_step_time: 1413ms, lr: 1.0882616e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:31,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65829 samples/s/p 0:04:30 } +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2936/ 3125], loss: 0.182, per_step_time: 1413ms, lr: 1.0656118e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:34,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.65892 samples/s/p 0:04:27 } +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2938/ 3125], loss: 0.155, per_step_time: 1413ms, lr: 1.0431707e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65963 samples/s/p 0:04:24 } +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2940/ 3125], loss: 0.265, per_step_time: 1412ms, lr: 1.0209978e-08, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:40,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.66172 samples/s/p 0:04:21 } +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2942/ 3125], loss: 0.220, per_step_time: 1414ms, lr: 9.990334e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:42,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.65581 samples/s/p 0:04:18 } +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2944/ 3125], loss: 0.210, per_step_time: 1413ms, lr: 9.773076e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65872 samples/s/p 0:04:15 } +2024-07-30 06:06:48,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2946/ 3125], loss: 0.314, per_step_time: 1413ms, lr: 9.558499e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65864 samples/s/p 0:04:13 } +2024-07-30 06:06:51,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2948/ 3125], loss: 0.209, per_step_time: 1414ms, lr: 9.346604e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:51,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.65507 samples/s/p 0:04:10 } +2024-07-30 06:06:54,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2950/ 3125], loss: 0.284, per_step_time: 1412ms, lr: 9.136498e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:54,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.66249 samples/s/p 0:04:07 } +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2952/ 3125], loss: 0.452, per_step_time: 1413ms, lr: 8.9284775e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:57,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65795 samples/s/p 0:04:04 } +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2954/ 3125], loss: 0.337, per_step_time: 1414ms, lr: 8.723438e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:06:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65716 samples/s/p 0:04:01 } +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2956/ 3125], loss: 0.389, per_step_time: 1413ms, lr: 8.520781e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:02,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65918 samples/s/p 0:03:58 } +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2958/ 3125], loss: 0.130, per_step_time: 1414ms, lr: 8.320212e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:05,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65579 samples/s/p 0:03:56 } +2024-07-30 06:07:08,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2960/ 3125], loss: 0.097, per_step_time: 1414ms, lr: 8.122623e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:08,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.65431 samples/s/p 0:03:53 } +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2962/ 3125], loss: 0.430, per_step_time: 1413ms, lr: 7.926523e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:11,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66095 samples/s/p 0:03:50 } +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2964/ 3125], loss: 0.220, per_step_time: 1412ms, lr: 7.733404e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:14,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66188 samples/s/p 0:03:47 } +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2966/ 3125], loss: 0.223, per_step_time: 1413ms, lr: 7.542371e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:16,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.66170 samples/s/p 0:03:44 } +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2968/ 3125], loss: 0.192, per_step_time: 1413ms, lr: 7.354021e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:19,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65951 samples/s/p 0:03:41 } +2024-07-30 06:07:22,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2970/ 3125], loss: 0.252, per_step_time: 1414ms, lr: 7.167458e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:22,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.65743 samples/s/p 0:03:39 } +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2972/ 3125], loss: 0.431, per_step_time: 1414ms, lr: 6.983876e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:25,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65651 samples/s/p 0:03:36 } +2024-07-30 06:07:28,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2974/ 3125], loss: 0.202, per_step_time: 1413ms, lr: 6.802976e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:28,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.66050 samples/s/p 0:03:33 } +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2976/ 3125], loss: 0.305, per_step_time: 1413ms, lr: 6.623864e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:31,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65970 samples/s/p 0:03:30 } +2024-07-30 06:07:33,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2978/ 3125], loss: 0.216, per_step_time: 1413ms, lr: 6.447136e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:33,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.65886 samples/s/p 0:03:27 } +2024-07-30 06:07:36,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2980/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 6.2727925e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:36,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66101 samples/s/p 0:03:24 } +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2982/ 3125], loss: 0.104, per_step_time: 1413ms, lr: 6.101131e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:39,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66074 samples/s/p 0:03:22 } +2024-07-30 06:07:42,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2984/ 3125], loss: 0.242, per_step_time: 1413ms, lr: 5.931854e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:42,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65965 samples/s/p 0:03:19 } +2024-07-30 06:07:45,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2986/ 3125], loss: 0.175, per_step_time: 1413ms, lr: 5.764663e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:45,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.66132 samples/s/p 0:03:16 } +2024-07-30 06:07:48,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2988/ 3125], loss: 0.338, per_step_time: 1413ms, lr: 5.600452e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:48,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.65936 samples/s/p 0:03:13 } +2024-07-30 06:07:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2990/ 3125], loss: 0.353, per_step_time: 1413ms, lr: 5.4374336e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65806 samples/s/p 0:03:10 } +2024-07-30 06:07:53,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2992/ 3125], loss: 0.474, per_step_time: 1413ms, lr: 5.277693e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:53,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65927 samples/s/p 0:03:08 } +2024-07-30 06:07:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2994/ 3125], loss: 0.334, per_step_time: 1413ms, lr: 5.120039e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65785 samples/s/p 0:03:05 } +2024-07-30 06:07:59,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2996/ 3125], loss: 0.304, per_step_time: 1413ms, lr: 4.965365e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:07:59,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.66042 samples/s/p 0:03:02 } +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 2998/ 3125], loss: 0.109, per_step_time: 1413ms, lr: 4.812181e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:02,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.65822 samples/s/p 0:02:59 } +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3000/ 3125], loss: 0.237, per_step_time: 1413ms, lr: 4.6625734e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:05,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65811 samples/s/p 0:02:56 } +2024-07-30 06:08:07,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3002/ 3125], loss: 0.179, per_step_time: 1413ms, lr: 4.5138595e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:07,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65815 samples/s/p 0:02:53 } +2024-07-30 06:08:10,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3004/ 3125], loss: 0.333, per_step_time: 1415ms, lr: 4.3684243e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:10,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65342 samples/s/p 0:02:51 } +2024-07-30 06:08:13,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3006/ 3125], loss: 0.258, per_step_time: 1413ms, lr: 4.225373e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:13,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.65920 samples/s/p 0:02:48 } +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3008/ 3125], loss: 0.352, per_step_time: 1414ms, lr: 4.0844084e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:16,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65653 samples/s/p 0:02:45 } +2024-07-30 06:08:19,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3010/ 3125], loss: 0.381, per_step_time: 1413ms, lr: 3.946125e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:19,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66082 samples/s/p 0:02:42 } +2024-07-30 06:08:22,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3012/ 3125], loss: 0.166, per_step_time: 1413ms, lr: 3.809929e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:22,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66072 samples/s/p 0:02:39 } +2024-07-30 06:08:24,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3014/ 3125], loss: 0.362, per_step_time: 1413ms, lr: 3.6761163e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:24,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.65984 samples/s/p 0:02:36 } +2024-07-30 06:08:27,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3016/ 3125], loss: 0.283, per_step_time: 1413ms, lr: 3.544986e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:27,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.66119 samples/s/p 0:02:34 } +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3018/ 3125], loss: 0.246, per_step_time: 1413ms, lr: 3.4165382e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:30,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66020 samples/s/p 0:02:31 } +2024-07-30 06:08:33,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3020/ 3125], loss: 0.203, per_step_time: 1413ms, lr: 3.2895802e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66093 samples/s/p 0:02:28 } +2024-07-30 06:08:36,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3022/ 3125], loss: 0.099, per_step_time: 1414ms, lr: 3.1656027e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:36,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65462 samples/s/p 0:02:25 } +2024-07-30 06:08:39,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3024/ 3125], loss: 0.406, per_step_time: 1413ms, lr: 3.043711e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.65967 samples/s/p 0:02:22 } +2024-07-30 06:08:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3026/ 3125], loss: 0.065, per_step_time: 1413ms, lr: 2.9245018e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:41,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.66144 samples/s/p 0:02:19 } +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3028/ 3125], loss: 0.321, per_step_time: 1414ms, lr: 2.8073788e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:44,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65489 samples/s/p 0:02:17 } +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3030/ 3125], loss: 0.028, per_step_time: 1413ms, lr: 2.6926397e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65941 samples/s/p 0:02:14 } +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3032/ 3125], loss: 0.117, per_step_time: 1413ms, lr: 2.580881e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:50,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.65895 samples/s/p 0:02:11 } +2024-07-30 06:08:53,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3034/ 3125], loss: 0.190, per_step_time: 1416ms, lr: 2.4709106e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:53,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.64727 samples/s/p 0:02:08 } +2024-07-30 06:08:56,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3036/ 3125], loss: 0.496, per_step_time: 1414ms, lr: 2.3639202e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:56,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65730 samples/s/p 0:02:05 } +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3038/ 3125], loss: 0.532, per_step_time: 1414ms, lr: 2.2587179e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:08:58,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65552 samples/s/p 0:02:03 } +2024-07-30 06:09:01,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3040/ 3125], loss: 0.358, per_step_time: 1412ms, lr: 2.155602e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:01,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.66262 samples/s/p 0:02:00 } +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3042/ 3125], loss: 0.352, per_step_time: 1413ms, lr: 2.0557642e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65869 samples/s/p 0:01:57 } +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3044/ 3125], loss: 0.201, per_step_time: 1414ms, lr: 1.9577144e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:07,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.65572 samples/s/p 0:01:54 } +2024-07-30 06:09:10,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3046/ 3125], loss: 0.236, per_step_time: 1413ms, lr: 1.8620491e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:10,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65910 samples/s/p 0:01:51 } +2024-07-30 06:09:13,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3048/ 3125], loss: 0.417, per_step_time: 1416ms, lr: 1.7693639e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:13,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.64631 samples/s/p 0:01:49 } +2024-07-30 06:09:15,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3050/ 3125], loss: 0.288, per_step_time: 1413ms, lr: 1.6784667e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:15,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65908 samples/s/p 0:01:46 } +2024-07-30 06:09:18,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3052/ 3125], loss: 0.300, per_step_time: 1415ms, lr: 1.5902519e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:18,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65230 samples/s/p 0:01:43 } +2024-07-30 06:09:21,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3054/ 3125], loss: 0.165, per_step_time: 1413ms, lr: 1.5044211e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:21,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.65779 samples/s/p 0:01:40 } +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3056/ 3125], loss: 0.212, per_step_time: 1412ms, lr: 1.4206767e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:24,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66187 samples/s/p 0:01:37 } +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3058/ 3125], loss: 0.264, per_step_time: 1413ms, lr: 1.3396143e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:27,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65894 samples/s/p 0:01:34 } +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3060/ 3125], loss: 0.296, per_step_time: 1412ms, lr: 1.2612342e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:30,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66236 samples/s/p 0:01:31 } +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3062/ 3125], loss: 0.255, per_step_time: 1414ms, lr: 1.1846423e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:32,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.65461 samples/s/p 0:01:29 } +2024-07-30 06:09:35,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3064/ 3125], loss: 0.113, per_step_time: 1413ms, lr: 1.1107325e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:35,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.66087 samples/s/p 0:01:26 } +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3066/ 3125], loss: 0.314, per_step_time: 1412ms, lr: 1.038909e-09, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:38,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66225 samples/s/p 0:01:23 } +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3068/ 3125], loss: 0.279, per_step_time: 1414ms, lr: 9.694695e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:41,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65746 samples/s/p 0:01:20 } +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3070/ 3125], loss: 0.359, per_step_time: 1413ms, lr: 9.0271235e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:44,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.66107 samples/s/p 0:01:17 } +2024-07-30 06:09:47,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3072/ 3125], loss: 0.253, per_step_time: 1413ms, lr: 8.380413e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:47,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.65845 samples/s/p 0:01:14 } +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3074/ 3125], loss: 0.156, per_step_time: 1413ms, lr: 7.7605244e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:49,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66076 samples/s/p 0:01:12 } +2024-07-30 06:09:52,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3076/ 3125], loss: 0.150, per_step_time: 1412ms, lr: 7.161498e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:52,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.66312 samples/s/p 0:01:09 } +2024-07-30 06:09:55,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3078/ 3125], loss: 0.324, per_step_time: 1413ms, lr: 6.595254e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:55,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65857 samples/s/p 0:01:06 } +2024-07-30 06:09:58,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3080/ 3125], loss: 0.265, per_step_time: 1414ms, lr: 6.043911e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:09:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65525 samples/s/p 0:01:03 } +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3082/ 3125], loss: 0.177, per_step_time: 1413ms, lr: 5.5164096e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:01,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.65968 samples/s/p 0:01:00 } +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3084/ 3125], loss: 0.305, per_step_time: 1415ms, lr: 5.0157306e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:04,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65355 samples/s/p 0:00:58 } +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3086/ 3125], loss: 0.515, per_step_time: 1419ms, lr: 4.5418738e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:06,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.63639 samples/s/p 0:00:55 } +2024-07-30 06:10:09,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3088/ 3125], loss: 0.140, per_step_time: 1415ms, lr: 4.0858983e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65206 samples/s/p 0:00:52 } +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3090/ 3125], loss: 0.113, per_step_time: 1414ms, lr: 3.6537645e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65662 samples/s/p 0:00:49 } +2024-07-30 06:10:15,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3092/ 3125], loss: 0.268, per_step_time: 1414ms, lr: 3.2514333e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.65423 samples/s/p 0:00:46 } +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3094/ 3125], loss: 0.468, per_step_time: 1413ms, lr: 2.8669833e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:18,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66079 samples/s/p 0:00:43 } +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3096/ 3125], loss: 0.111, per_step_time: 1412ms, lr: 2.5063754e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:21,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.66220 samples/s/p 0:00:40 } +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3098/ 3125], loss: 0.240, per_step_time: 1413ms, lr: 2.1785497e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65912 samples/s/p 0:00:38 } +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3100/ 3125], loss: 0.328, per_step_time: 1413ms, lr: 1.8656253e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:26,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.65915 samples/s/p 0:00:35 } +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3102/ 3125], loss: 0.275, per_step_time: 1413ms, lr: 1.5825033e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:29,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.65949 samples/s/p 0:00:32 } +2024-07-30 06:10:32,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3104/ 3125], loss: 0.162, per_step_time: 1413ms, lr: 1.3172625e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66097 samples/s/p 0:00:29 } +2024-07-30 06:10:35,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3106/ 3125], loss: 0.294, per_step_time: 1412ms, lr: 1.0818243e-10, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:35,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66282 samples/s/p 0:00:26 } +2024-07-30 06:10:38,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3108/ 3125], loss: 0.070, per_step_time: 1413ms, lr: 8.612871e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:38,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.66008 samples/s/p 0:00:24 } +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3110/ 3125], loss: 0.126, per_step_time: 1425ms, lr: 6.705522e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:40,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.61108 samples/s/p 0:00:21 } +2024-07-30 06:10:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3112/ 3125], loss: 0.257, per_step_time: 1413ms, lr: 5.0663945e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65837 samples/s/p 0:00:18 } +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3114/ 3125], loss: 0.175, per_step_time: 1414ms, lr: 3.606081e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:46,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65633 samples/s/p 0:00:15 } +2024-07-30 06:10:49,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3116/ 3125], loss: 0.208, per_step_time: 1415ms, lr: 2.3841857e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:49,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65278 samples/s/p 0:00:12 } +2024-07-30 06:10:52,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3118/ 3125], loss: 0.250, per_step_time: 1413ms, lr: 1.4603138e-11, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:52,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65924 samples/s/p 0:00:09 } +2024-07-30 06:10:55,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3120/ 3125], loss: 0.188, per_step_time: 1414ms, lr: 7.45058e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:55,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.65752 samples/s/p 0:00:07 } +2024-07-30 06:10:57,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3122/ 3125], loss: 0.388, per_step_time: 1413ms, lr: 2.682209e-12, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:10:57,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65859 samples/s/p 0:00:04 } +2024-07-30 06:11:00,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 3], step:[ 3124/ 3125], loss: 0.206, per_step_time: 1414ms, lr: 2.9802322e-13, overflow cond: False, loss_scale: 1.0 +2024-07-30 06:11:00,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.65745 samples/s/p 0:00:01 } +2024-07-30 06:11:00,848 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-30 06:11:33,330 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/run_llama3_8b_8k_800T_A2_64G_lora_dis_256.yaml" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/run_llama3_8b_8k_800T_A2_64G_lora_dis_256.yaml" new file mode 100644 index 00000000..7fc2878e --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/2. \345\276\256\350\260\203\346\227\245\345\277\227\344\270\216\351\205\215\347\275\256/run_llama3_8b_8k_800T_A2_64G_lora_dis_256.yaml" @@ -0,0 +1,206 @@ +seed: 0 +output_dir: './output' # path to save checkpoint/strategy # last try: 730_float_formatted_10w_r8a16 +load_checkpoint: '/home/ma-user/work/llama3-8B.ckpt' +src_strategy_path_or_dir: '' +auto_trans_ckpt: False # If true, auto transform load_checkpoint to load in distributed model +only_save_strategy: False +resume_training: False +run_mode: 'finetune' + +# trainer config +trainer: + type: CausalLanguageModelingTrainer + model_name: 'llama3_8b' + +# runner config +runner_config: + epochs: 3 + batch_size: 32 + sink_mode: True + sink_size: 2 + +# optimizer +optimizer: + type: FP32StateAdamWeightDecay + beta1: 0.9 + beta2: 0.95 + eps: 1.e-8 + +# lr sechdule +lr_schedule: + type: CosineWithWarmUpLR + learning_rate: 1.e-5 + lr_end: 0.0 + warmup_ratio: 0.03 + total_steps: -1 # -1 means it will load the total steps of the dataset + +# dataset +train_dataset: &train_dataset + data_loader: + type: MindDataset + dataset_dir: "/home/ma-user/work/train-fastchat256_ranked.mindrecord" + shuffle: True + input_columns: ["input_ids", "labels"] # "input_ids", "labels" , labels are used in instruction finetune. + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: True + batch_size: 32 + repeat: 1 + numa_enable: False + prefetch_size: 1 +train_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *train_dataset +# if True, do evaluate during the training process. if false, do nothing. +# note that the task trainer should support _evaluate_in_training function. +do_eval: False + +# eval dataset +eval_dataset: &eval_dataset + data_loader: + type: MindDataset + dataset_dir: "" + shuffle: False + input_columns: ["input_ids"] + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: False + repeat: 1 + numa_enable: False + prefetch_size: 1 +eval_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *eval_dataset + +use_parallel: True +# parallel context config +parallel: + parallel_mode: 1 # 0-data parallel, 1-semi-auto parallel, 2-auto parallel, 3-hybrid parallel + gradients_mean: False + enable_alltoall: False + full_batch: True + search_mode: "sharding_propagation" + enable_parallel_optimizer: True + strategy_ckpt_config: + save_file: "./ckpt_strategy.ckpt" + only_trainable_params: False + parallel_optimizer_config: + gradient_accumulation_shard: False + parallel_optimizer_threshold: 64 +# default parallel of device num = 8 for Atlas 800T A2 +parallel_config: + data_parallel: 1 + model_parallel: 4 + pipeline_stage: 1 + use_seq_parallel: False + micro_batch_num: 1 + vocab_emb_dp: True + gradient_aggregation_group: 4 +# when model parallel is greater than 1, we can set micro_batch_interleave_num=2, that may accelerate the train process. +micro_batch_interleave_num: 1 + +# recompute config +recompute_config: + recompute: True + select_recompute: False + parallel_optimizer_comm_recompute: False + mp_comm_recompute: True + recompute_slice_activation: True + +# callbacks +callbacks: + - type: MFLossMonitor + - type: CheckpointMointor + prefix: "llama3_8b" + save_checkpoint_steps: 1400 + integrated_save: False + async_save: False + - type: ObsMonitor + +# mindspore context init config +context: + mode: 0 #0--Graph Mode; 1--Pynative Mode + device_target: "Ascend" + enable_graph_kernel: False + graph_kernel_flags: "--disable_expand_ops=Softmax,Dropout --enable_parallel_fusion=true --reduce_fuse_depth=8 --enable_auto_tensor_inplace=true" + max_call_depth: 10000 + max_device_memory: "26GB" + save_graphs: False + save_graphs_path: "./graph" + device_id: 0 + runtime_num_threads: 1 + +# model config +model: + model_config: + type: LlamaConfig + batch_size: 32 # add for increase predict + seq_length: 256 + hidden_size: 4096 + num_layers: 32 + num_heads: 32 + n_kv_heads: 8 + vocab_size: 128256 + intermediate_size: 14336 + rms_norm_eps: 1.0e-5 + bos_token_id: 128000 + eos_token_id: 128001 + pad_token_id: 128002 + ignore_token_id: -100 + compute_dtype: "bfloat16" + layernorm_compute_type: "float32" + softmax_compute_type: "float32" + rotary_dtype: "float32" + param_init_type: "bfloat16" + use_past: False + scaling_factor: 1.0 + theta: 500000 + extend_method: "None" # support "None", "PI", "NTK" + use_flash_attention: True # FA can accelerate training or finetune + offset: 0 + fine_grain_interleave: 1 + checkpoint_name_or_path: "/home/ma-user/work/ms_ckpt/llama3-8B.ckpt" + repetition_penalty: 1 + max_decode_length: 512 + top_k: 3 + top_p: 1 + do_sample: False + pet_config: + pet_type: lora + # configuration of lora + lora_rank: 8 + lora_alpha: 16 + lora_dropout: 0.0 + target_modules: '.*wq|.*wv' + arch: + type: LlamaForCausalLM + +# metric +metric: + type: PerplexityMetric + +# wrapper cell config +runner_wrapper: + type: MFTrainOneStepCell + scale_sense: 1.0 + use_clip_grad: True + +eval_callbacks: + - type: ObsMonitor + +auto_tune: False +filepath_prefix: './autotune' +autotune_per_step: 10 + +profile: False +profile_start_step: 4 +profile_stop_step: 8 +init_start_profile: False +profile_communication: False +profile_memory: True +layer_scale: False +layer_decay: 0.65 +lr_scale_factor: 256 + +# aicc +remote_save_url: "Please input obs url on AICC platform." diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/4. \345\216\237\346\234\211\350\203\275\345\212\233\346\265\213\350\257\204\346\227\245\345\277\227/730_eval_min_token_equ_1_log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/4. \345\216\237\346\234\211\350\203\275\345\212\233\346\265\213\350\257\204\346\227\245\345\277\227/730_eval_min_token_equ_1_log" new file mode 100644 index 00000000..b4d0755e --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/4. \345\216\237\346\234\211\350\203\275\345\212\233\346\265\213\350\257\204\346\227\245\345\277\227/730_eval_min_token_equ_1_log" @@ -0,0 +1,45002 @@ +2024-07-30 13:29:02,673 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/output' +2024-07-30 13:29:02,695 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/mindformers/configs/general/run_general_task.yaml to build trainer. +2024-07-30 13:29:02,695 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-30 13:29:02,696 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': False, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-30 13:29:02,696 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 1, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-30 13:29:02,696 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/mindformers/output' +2024-07-30 13:29:02,697 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_0.ckpt' +2024-07-30 13:29:02,697 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-30 13:29:02,697 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. +2024-07-30 13:29:02,697 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-30 13:29:02,698 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-30 13:29:02,698 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 13:29:02,698 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-30 13:29:02,698 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-30 13:29:02,699 - mindformers[mindformers/trainer/base_trainer.py:213] - INFO - The current parallel mode is stand_alone, batch size per card will not be changed: batch_size_per_card = 1 +2024-07-30 13:29:02,699 - mindformers[mindformers/trainer/base_trainer.py:217] - INFO - global_batch_size = batch_size_per_card * device_num * gradient_accumulation_steps = 1 = 1 * 1 * 1 +2024-07-30 13:29:02,699 - mindformers[mindformers/trainer/base_trainer.py:226] - INFO - parallel_config will be change to default config: [ParallelConfig] +_recompute:[ParallelConfig] +_recompute:False +_select_recompute:False +_select_comm_recompute:False +_parallel_optimizer_comm_recompute:False +_mp_comm_recompute:True +_recompute_slice_activation:True + +select_recompute:False +use_seq_parallel:False +_optimizer_shard:None +_gradient_aggregation_group:4 +_embed_dp_mp_config:[ParallelConfig] +_dp_mp_config:[ParallelConfig] +_data_parallel:1 +_model_parallel:1 +use_seq_parallel:False +select_recompute:False + +_vocab_emb_dp:True +use_seq_parallel:False +select_recompute:False + +_pp_config:[ParallelConfig] +_pipeline_stage:1 +_micro_batch_num:1 + +_moe_config:[ParallelConfig] +_dpmp:[ParallelConfig] +_data_parallel:1 +_model_parallel:1 +use_seq_parallel:False +select_recompute:False + +_expert_parallel:1 +use_seq_parallel:False +select_recompute:False + +. +2024-07-30 13:29:02,700 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:193] - INFO - .........Build Dataset For Evaluate.......... +2024-07-30 13:29:02,700 - mindformers[mindformers/trainer/base_trainer.py:360] - INFO - .........Build Dataset From Config.......... +2024-07-30 13:29:02,700 - mindformers[mindformers/trainer/base_trainer.py:379] - INFO - For evaluate phase, batch size for eval dataset is 1, different from training, not multiplied by micro_batch_num, micro_batch_interleave_num and gradient_accumulation_steps +2024-07-30 13:29:02,701 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-30 13:29:02,711 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:196] - INFO - Create evaluate dataset finish, dataset size:2067 +2024-07-30 13:29:02,714 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-30 13:29:02,715 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-30 13:29:02,715 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. +2024-07-30 13:29:02,715 - mindformers[mindformers/version_control.py:71] - INFO - The Cell Reuse compilation acceleration feature does not support single-card mode.This feature is disabled by default. ENABLE_CELL_REUSE=1 does not take effect. +2024-07-30 13:29:02,715 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +2024-07-30 13:29:35,166 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:37,875 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:40,537 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:43,194 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:45,868 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:48,571 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:51,260 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:53,996 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:56,738 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:29:59,464 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-30 13:31:03,978 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-30 13:31:03,979 - mindformers[mindformers/models/modeling_utils.py:591] - INFO - Set jit config for jit level:O0 and infer boost:on. +2024-07-30 13:31:03,996 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 8030261248. +2024-07-30 13:31:03,996 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:210] - INFO - .........Build Compute Metrics For Evaluate.......... +2024-07-30 13:31:03,997 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:217] - INFO - .........Build tokenizer For Evaluate.......... +2024-07-30 13:31:05,105 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:221] - INFO - .........Starting Init Evaluate Model.......... +2024-07-30 13:31:05,105 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:228] - INFO - .............Start load checkpoint for eval.................. +2024-07-30 13:31:05,149 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +2024-07-30 13:44:38,123 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.0.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.1.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.1.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.2.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.2.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.3.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.3.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.4.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.4.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.5.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.5.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.6.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.6.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.7.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.7.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.8.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.8.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.9.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.9.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.10.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.10.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.11.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.11.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.12.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.12.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.13.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.13.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.14.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.14.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.15.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.15.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.16.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.16.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.17.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.17.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.18.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.18.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.19.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.19.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.20.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.20.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.21.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.21.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.22.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.22.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.23.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.23.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.24.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.24.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.25.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.25.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.26.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.26.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.27.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.27.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.28.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.28.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.29.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.29.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.30.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.30.attention.infer_attention.paged_attention_mgr.value_cache', 'model.layers.31.attention.infer_attention.paged_attention_mgr.key_cache', 'model.layers.31.attention.infer_attention.paged_attention_mgr.value_cache'], ['scale_sense', 'global_step', 'epoch_num', 'step_num', 'loss_scale']) +2024-07-30 13:44:38,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:236] - INFO - .........Starting Evaluate Model.......... +{'auto_trans_ckpt': False, + 'auto_tune': False, + 'autotune_per_step': 10, + 'callbacks': [OrderedDict([('type', 'MFLossMonitor')]), + OrderedDict([('type', 'CheckpointMointor'), + ('prefix', 'llama3_8b'), + ('save_checkpoint_steps', 10000), + ('integrated_save', False), + ('async_save', False)]), + OrderedDict([('type', 'ObsMonitor')])], + 'context': {'device_id': 0, + 'device_target': 'Ascend', + 'enable_graph_kernel': False, + 'graph_kernel_flags': '--disable_expand_ops=Softmax,Dropout ' + '--enable_parallel_fusion=true ' + '--reduce_fuse_depth=8 ' + '--enable_auto_tensor_inplace=true', + 'max_call_depth': 10000, + 'runtime_num_threads': 1, + 'save_graphs': False, + 'save_graphs_path': './graph'}, + 'device_num': 1, + 'do_eval': False, + 'eval_callbacks': [OrderedDict([('type', 'ObsMonitor')])], + 'eval_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 1, + 'data_loader': {'dataset_dir': '/home/ma-user/work/mindformers/squad8192.mindrecord', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'eval_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 1, + 'data_loader': {'dataset_dir': '/home/ma-user/work/mindformers/squad8192.mindrecord', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', + 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', + 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'filepath_prefix': './autotune', + 'init_start_profile': False, + 'layer_decay': 0.65, + 'layer_scale': False, + 'load_checkpoint': '/home/ma-user/work/mindformers/research/output/checkpoint/merged_lora.ckpt', + 'local_rank': 0, + 'lr_scale_factor': 256, + 'lr_schedule': {'learning_rate': 5e-05, + 'lr_end': 0.0, + 'total_steps': -1, + 'type': 'CosineWithWarmUpLR', + 'warmup_ratio': 0.03}, + 'metric': [{'type': 'EmF1Metric'}], + 'micro_batch_interleave_num': 1, + 'model': {'arch': {'type': 'LlamaForCausalLM'}, + 'model_config': {'batch_size': 1, + 'bos_token_id': 128000, + 'checkpoint_name_or_path': None, + 'compute_dtype': 'float16', + 'do_sample': False, + 'eos_token_id': 128001, + 'extend_method': 'None', + 'fine_grain_interleave': 1, + 'hidden_size': 4096, + 'ignore_token_id': -100, + 'intermediate_size': 14336, + 'layernorm_compute_type': 'float32', + 'max_decode_length': 700, + 'max_new_tokens': 20, + 'min_new_tokens': 1, + 'n_kv_heads': 8, + 'num_heads': 32, + 'num_layers': 32, + 'offset': 0, + 'pad_token_id': 128002, + 'param_init_type': 'float16', + 'repetition_penalty': 1, + 'rms_norm_eps': 1e-05, + 'rotary_dtype': 'float32', + 'scaling_factor': 1.0, + 'seq_length': 8192, + 'softmax_compute_type': 'float32', + 'theta': 500000, + 'top_k': 3, + 'top_p': 1, + 'type': 'LlamaConfig', + 'use_flash_attention': False, + 'use_past': True, + 'vocab_size': 128256}}, + 'moe_config': , + 'only_save_strategy': False, + 'optimizer': {'beta1': 0.9, + 'beta2': 0.95, + 'eps': 1e-08, + 'learning_rate': 5e-05, + 'type': 'FP32StateAdamWeightDecay'}, + 'output_dir': './output', + 'parallel': {'enable_alltoall': False, + 'enable_parallel_optimizer': False, + 'full_batch': True, + 'gradients_mean': False, + 'parallel_mode': 1, + 'parallel_optimizer_config': {'gradient_accumulation_shard': False, + 'parallel_optimizer_threshold': 64}, + 'search_mode': 'sharding_propagation', + 'strategy_ckpt_save_file': './output/strategy/ckpt_strategy_rank_0.ckpt'}, + 'parallel_config': , + 'processor': {'return_tensors': 'ms', + 'tokenizer': {'model_max_length': 8192, + 'pad_token': '<|reserved_special_token_0|>', + 'type': 'Llama3Tokenizer', + 'vocab_file': '/home/ma-user/work/tokenizer.model'}, + 'type': 'LlamaProcessor'}, + 'profile': False, + 'profile_communication': False, + 'profile_memory': True, + 'profile_start_step': 4, + 'profile_stop_step': 8, + 'rank_id': 0, + 'recompute_config': , + 'remote_save_url': 'Please input obs url on AICC platform.', + 'resume_training': False, + 'run_mode': 'eval', + 'runner_config': {'batch_size': 1, + 'epochs': 1, + 'gradient_accumulation_steps': 1, + 'sink_mode': True, + 'sink_size': 2}, + 'runner_wrapper': {'scale_sense': 1.0, + 'type': 'MFTrainOneStepCell', + 'use_clip_grad': True}, + 'seed': 0, + 'src_strategy_path_or_dir': '', + 'train_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 1, + 'data_loader': {'dataset_dir': '', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'train_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 1, + 'data_loader': {'dataset_dir': '', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'trainer': {'model_name': 'llama3_8b', + 'type': 'CausalLanguageModelingTrainer'}, + 'use_parallel': False} +2024-07-30 13:44:38,179 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:44:38,179 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:44:38,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:44:38,180 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:44:38,181 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:14,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:27,860 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 49.67879033088684 s; generated tokens: 15 tokens; generate speed: 0.30193971914557743 tokens/s +2024-07-30 13:45:27,865 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:27,865 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1/2067], cost time 49.6934s, every example cost time is 49.6934, generate speed: 0.3019 tokens/s, avg speed: 0.0000 tokens/s, remaining time: 0:00:00 +pred is: + ['Denver Broncos'] + label is: + ['Denver Broncos'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:29,293 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:29,294 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:29,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:29,295 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:29,295 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:30,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.518347978591919 s; generated tokens: 19 tokens; generate speed: 12.513600484139456 tokens/s +2024-07-30 13:45:30,818 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:30,818 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2/2067], cost time 1.5303s, every example cost time is 1.5303, generate speed: 12.4158 tokens/s, avg speed: 12.4150 tokens/s, remaining time: 0:26:20 +pred is: + ['Cam Newton'] + label is: + ['Cam Newton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:30,901 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:30,901 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 119, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:30,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:30,902 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:30,902 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:31,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:31,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:31,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:31,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:31,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,440 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.538034200668335 s; generated tokens: 20 tokens; generate speed: 13.003612007658369 tokens/s +2024-07-30 13:45:32,445 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:32,445 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[3/2067], cost time 1.5492s, every example cost time is 1.5492, generate speed: 12.9099 tokens/s, avg speed: 12.6640 tokens/s, remaining time: 0:35:18 +pred is: + ['Von Miller'] + label is: + ['Von Miller'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:32,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:32,528 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 140, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:32,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:32,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:32,529 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:33,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:33,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:33,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:33,548 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0181856155395508 s; generated tokens: 3 tokens; generate speed: 2.946417582623438 tokens/s +2024-07-30 13:45:33,552 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:33,553 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[4/2067], cost time 1.0292s, every example cost time is 1.0292, generate speed: 2.9149 tokens/s, avg speed: 10.2219 tokens/s, remaining time: 0:35:19 +pred is: + ['CBS'] + label is: + ['CBS'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:33,635 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:33,635 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 92, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:33,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:33,636 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:33,636 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:34,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:34,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:35,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530038595199585 s; generated tokens: 20 tokens; generate speed: 13.071565686479374 tokens/s +2024-07-30 13:45:35,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:35,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[5/2067], cost time 1.5411s, every example cost time is 1.5411, generate speed: 12.9780 tokens/s, avg speed: 10.9737 tokens/s, remaining time: 0:38:50 +pred is: + ['Roger Goodell'] + label is: + ['Roger Goodell'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:35,254 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:35,254 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 88, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:35,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:35,255 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:35,255 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:36,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,792 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5367236137390137 s; generated tokens: 20 tokens; generate speed: 13.014702072116828 tokens/s +2024-07-30 13:45:36,796 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:36,797 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[6/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9223 tokens/s, avg speed: 11.3927 tokens/s, remaining time: 0:41:12 +pred is: + ['1'] + label is: + ["New Orleans' Mercedes-Benz Superdome"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:45:36,880 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:36,880 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:36,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:36,881 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:36,881 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:37,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:37,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:37,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:37,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:37,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:37,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,142 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2607908248901367 s; generated tokens: 11 tokens; generate speed: 8.724682780713067 tokens/s +2024-07-30 13:45:38,147 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:38,147 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[7/2067], cost time 1.2718s, every example cost time is 1.2718, generate speed: 8.6492 tokens/s, avg speed: 10.9807 tokens/s, remaining time: 0:41:32 +pred is: + ['2012'] + label is: + ['October 16, 2012'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 13:45:38,229 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:38,230 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 137, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:38,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:38,230 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:38,230 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:39,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,649 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4188182353973389 s; generated tokens: 16 tokens; generate speed: 11.276990667884398 tokens/s +2024-07-30 13:45:39,654 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:39,655 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[8/2067], cost time 1.4301s, every example cost time is 1.4301, generate speed: 11.1880 tokens/s, avg speed: 11.0107 tokens/s, remaining time: 0:42:27 +pred is: + ['2013'] + label is: + ['May 21, 2013'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 13:45:39,743 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:39,743 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:39,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:39,744 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:39,744 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:40,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:40,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:41,285 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5406227111816406 s; generated tokens: 20 tokens; generate speed: 12.98176370816981 tokens/s +2024-07-30 13:45:41,290 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:41,290 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[9/2067], cost time 1.5522s, every example cost time is 1.5522, generate speed: 12.8851 tokens/s, avg speed: 11.2647 tokens/s, remaining time: 0:43:38 +pred is: + ['1'] + label is: + ['John Fox'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:45:41,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:41,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:41,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:41,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:41,374 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:42,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,761 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3871822357177734 s; generated tokens: 15 tokens; generate speed: 10.81328726231742 tokens/s +2024-07-30 13:45:42,766 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:42,766 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[10/2067], cost time 1.3983s, every example cost time is 1.3983, generate speed: 10.7276 tokens/s, avg speed: 11.2063 tokens/s, remaining time: 0:44:03 +pred is: + ['1'] + label is: + ['DeAngelo Williams'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 55.71428571428571, Em score: 50.0, current_count: 10 +2024-07-30 13:45:42,851 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:42,851 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 334, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:42,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:42,852 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:42,852 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:43,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:43,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:43,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:43,862 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0102424621582031 s; generated tokens: 3 tokens; generate speed: 2.9695841467513 tokens/s +2024-07-30 13:45:43,867 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:43,867 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[11/2067], cost time 1.0212s, every example cost time is 1.0212, generate speed: 2.9378 tokens/s, avg speed: 10.5976 tokens/s, remaining time: 0:43:12 +pred is: + ['6'] + label is: + ['six'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:45:43,950 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:43,950 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 297, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:43,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:43,951 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:43,951 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:44,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:44,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:44,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:44,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,146 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1952509880065918 s; generated tokens: 9 tokens; generate speed: 7.529799255811504 tokens/s +2024-07-30 13:45:45,151 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:45,151 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[12/2067], cost time 1.2062s, every example cost time is 1.2062, generate speed: 7.4613 tokens/s, avg speed: 10.3467 tokens/s, remaining time: 0:43:01 +pred is: + ['308'] + label is: + ['308'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:45,239 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:45,239 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 469, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:45,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:45,240 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:45,240 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:46,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,508 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2676384449005127 s; generated tokens: 11 tokens; generate speed: 8.677553165298097 tokens/s +2024-07-30 13:45:46,513 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:46,513 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[13/2067], cost time 1.2789s, every example cost time is 1.2789, generate speed: 8.6012 tokens/s, avg speed: 10.2102 tokens/s, remaining time: 0:43:04 +pred is: + ['Gary Kubiak'] + label is: + ['Gary Kubiak'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:46,595 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:46,596 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:46,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:46,596 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:46,596 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:47,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,668 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071436882019043 s; generated tokens: 5 tokens; generate speed: 4.666630469708932 tokens/s +2024-07-30 13:45:47,673 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:47,673 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[14/2067], cost time 1.0824s, every example cost time is 1.0824, generate speed: 4.6196 tokens/s, avg speed: 9.8632 tokens/s, remaining time: 0:42:37 +pred is: + ['67.9'] + label is: + ['67.9'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:47,755 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:47,756 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:47,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:47,756 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:47,757 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:48,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,826 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0694465637207031 s; generated tokens: 5 tokens; generate speed: 4.675315410434851 tokens/s +2024-07-30 13:45:48,831 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:48,831 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[15/2067], cost time 1.0803s, every example cost time is 1.0803, generate speed: 4.6281 tokens/s, avg speed: 9.5578 tokens/s, remaining time: 0:42:13 +pred is: + ['4,530'] + label is: + ['4,530'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:48,921 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:48,921 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:48,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:48,922 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:48,922 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:49,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:49,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:49,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:49,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:49,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,266 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3434441089630127 s; generated tokens: 14 tokens; generate speed: 10.420976880687967 tokens/s +2024-07-30 13:45:50,270 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:50,270 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[16/2067], cost time 1.3545s, every example cost time is 1.3545, generate speed: 10.3363 tokens/s, avg speed: 9.6109 tokens/s, remaining time: 0:42:27 +pred is: + ['Seattle Seahawks'] + label is: + ['Seattle Seahawks'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:50,353 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:50,353 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:50,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:50,354 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:50,354 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:51,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,894 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5392839908599854 s; generated tokens: 20 tokens; generate speed: 12.993053990528521 tokens/s +2024-07-30 13:45:51,898 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:51,899 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[17/2067], cost time 1.5504s, every example cost time is 1.5504, generate speed: 12.9001 tokens/s, avg speed: 9.8489 tokens/s, remaining time: 0:43:03 +pred is: + ['Pittsburgh Steelers'] + label is: + ['Pittsburgh Steelers'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:51,981 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:51,982 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 113, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:51,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:51,982 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:51,983 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:52,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:52,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:52,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,333 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3497228622436523 s; generated tokens: 14 tokens; generate speed: 10.372499712072534 tokens/s +2024-07-30 13:45:53,337 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:53,337 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[18/2067], cost time 1.3608s, every example cost time is 1.3608, generate speed: 10.2877 tokens/s, avg speed: 9.8751 tokens/s, remaining time: 0:43:13 +pred is: + ['Thomas Davis'] + label is: + ['Thomas Davis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:53,426 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:53,426 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:53,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:53,427 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:53,427 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:54,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:54,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:54,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:54,435 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0076117515563965 s; generated tokens: 3 tokens; generate speed: 2.9773372485643232 tokens/s +2024-07-30 13:45:54,440 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:54,440 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[19/2067], cost time 1.0188s, every example cost time is 1.0188, generate speed: 2.9446 tokens/s, avg speed: 9.5785 tokens/s, remaining time: 0:42:45 +pred is: + ['39'] + label is: + ['39'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:54,529 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:54,530 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:54,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:54,531 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:54,531 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:55,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:55,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.414794683456421 s; generated tokens: 16 tokens; generate speed: 11.309061439862866 tokens/s +2024-07-30 13:45:55,950 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:55,951 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[20/2067], cost time 1.4260s, every example cost time is 1.4260, generate speed: 11.2199 tokens/s, avg speed: 9.6712 tokens/s, remaining time: 0:43:02 +pred is: + ['1998'] + label is: + ['1998'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 72.85714285714286, Em score: 70.0, current_count: 20 +2024-07-30 13:45:56,042 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:56,042 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 104, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:56,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:56,043 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:56,043 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:56,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,361 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3178915977478027 s; generated tokens: 13 tokens; generate speed: 9.864240748037407 tokens/s +2024-07-30 13:45:57,366 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:57,366 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[21/2067], cost time 1.3292s, every example cost time is 1.3292, generate speed: 9.7802 tokens/s, avg speed: 9.6767 tokens/s, remaining time: 0:43:07 +pred is: + ['XX'] + label is: + ['Super Bowl XX'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:45:57,448 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:57,449 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:57,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:57,449 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:57,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:45:58,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:58,985 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5356090068817139 s; generated tokens: 20 tokens; generate speed: 13.024148666992403 tokens/s +2024-07-30 13:45:58,990 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:45:58,990 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[22/2067], cost time 1.5468s, every example cost time is 1.5468, generate speed: 12.9300 tokens/s, avg speed: 9.8557 tokens/s, remaining time: 0:43:32 +pred is: + ['Justin Tucker'] + label is: + ['Justin Tucker'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:45:59,072 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:45:59,073 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:45:59,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:45:59,073 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:45:59,074 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:00,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,610 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5362281799316406 s; generated tokens: 20 tokens; generate speed: 13.018899315393345 tokens/s +2024-07-30 13:46:00,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:00,619 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[23/2067], cost time 1.5512s, every example cost time is 1.5512, generate speed: 12.8934 tokens/s, avg speed: 10.0146 tokens/s, remaining time: 0:43:55 +pred is: + ['The Panthers were designated as the home team in the Super Bowl.'] + label is: + ['Broncos'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:00,702 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:00,702 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 79, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:00,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:00,703 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:00,703 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:01,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:01,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:02,228 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.524925708770752 s; generated tokens: 20 tokens; generate speed: 13.11539302207848 tokens/s +2024-07-30 13:46:02,233 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:02,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[24/2067], cost time 1.5361s, every example cost time is 1.5361, generate speed: 13.0198 tokens/s, avg speed: 10.1626 tokens/s, remaining time: 0:44:15 +pred is: + ['San Jose State'] + label is: + ['San Jose State'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:02,318 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:02,318 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:02,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:02,319 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:02,319 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:03,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,583 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2631936073303223 s; generated tokens: 11 tokens; generate speed: 8.708087134202481 tokens/s +2024-07-30 13:46:03,587 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:03,588 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[25/2067], cost time 1.2749s, every example cost time is 1.2749, generate speed: 8.6283 tokens/s, avg speed: 10.1024 tokens/s, remaining time: 0:44:11 +pred is: + ['2014'] + label is: + ['June 4, 2014'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 13:46:03,669 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:03,669 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:03,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:03,670 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:03,670 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:04,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:04,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:04,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:04,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0085291862487793 s; generated tokens: 3 tokens; generate speed: 2.974628836631381 tokens/s +2024-07-30 13:46:04,684 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:04,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[26/2067], cost time 1.0196s, every example cost time is 1.0196, generate speed: 2.9422 tokens/s, avg speed: 9.8844 tokens/s, remaining time: 0:43:48 +pred is: + ['Gold'] + label is: + ['gold'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:04,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:04,766 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:04,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:04,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:04,767 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:05,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:05,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:06,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2570998668670654 s; generated tokens: 11 tokens; generate speed: 8.750299232322819 tokens/s +2024-07-30 13:46:06,029 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:06,029 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[27/2067], cost time 1.2681s, every example cost time is 1.2681, generate speed: 8.6742 tokens/s, avg speed: 9.8402 tokens/s, remaining time: 0:43:45 +pred is: + ['Moscone Center'] + label is: + ['Moscone Center'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:06,112 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:06,112 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:06,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:06,113 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:06,113 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:07,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.499924898147583 s; generated tokens: 19 tokens; generate speed: 12.6673008918414 tokens/s +2024-07-30 13:46:07,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:07,618 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[28/2067], cost time 1.5111s, every example cost time is 1.5111, generate speed: 12.5733 tokens/s, avg speed: 9.9541 tokens/s, remaining time: 0:44:00 +pred is: + ['Santa Clara University'] + label is: + ['Santa Clara University'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:07,702 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:07,702 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:07,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:07,703 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:07,703 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:08,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:08,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:09,325 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.621246576309204 s; generated tokens: 20 tokens; generate speed: 12.336186421149055 tokens/s +2024-07-30 13:46:09,329 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:09,330 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[29/2067], cost time 1.6325s, every example cost time is 1.6325, generate speed: 12.2508 tokens/s, avg speed: 10.0530 tokens/s, remaining time: 0:44:23 +pred is: + ['Monday'] + label is: + ['Monday'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:09,412 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:09,412 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 136, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:09,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:09,413 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:09,413 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:10,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,777 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3636469841003418 s; generated tokens: 14 tokens; generate speed: 10.26658670699618 tokens/s +2024-07-30 13:46:10,782 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:10,782 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[30/2067], cost time 1.3750s, every example cost time is 1.3750, generate speed: 10.1819 tokens/s, avg speed: 10.0575 tokens/s, remaining time: 0:44:26 +pred is: + ['Business Connect'] + label is: + ['Business Connect'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 73.96825396825396, Em score: 70.0, current_count: 30 +2024-07-30 13:46:10,871 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:10,872 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 122, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:10,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:10,872 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:10,872 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:11,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:11,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:11,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:11,881 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0084812641143799 s; generated tokens: 3 tokens; generate speed: 2.9747701883529944 tokens/s +2024-07-30 13:46:11,886 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:11,886 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[31/2067], cost time 1.0196s, every example cost time is 1.0196, generate speed: 2.9422 tokens/s, avg speed: 9.8775 tokens/s, remaining time: 0:44:06 +pred is: + ['25'] + label is: + ['25'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:11,968 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:11,968 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:11,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:11,969 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:11,969 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:12,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:12,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:12,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,524 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5545969009399414 s; generated tokens: 20 tokens; generate speed: 12.865071317141817 tokens/s +2024-07-30 13:46:13,528 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:13,529 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[32/2067], cost time 1.5657s, every example cost time is 1.5657, generate speed: 12.7738 tokens/s, avg speed: 9.9858 tokens/s, remaining time: 0:44:21 +pred is: + ['Vince Lombardi'] + label is: + ['Vince Lombardi'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:13,611 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:13,611 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:13,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:13,612 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:13,612 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:14,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:14,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:15,143 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310096740722656 s; generated tokens: 20 tokens; generate speed: 13.06327473869115 tokens/s +2024-07-30 13:46:15,148 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:15,148 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[33/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9692 tokens/s, avg speed: 10.0918 tokens/s, remaining time: 0:44:35 +pred is: + ['A'] + label is: + ['CBS'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:15,231 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:15,231 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:15,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:15,232 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:15,232 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:16,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,740 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5078065395355225 s; generated tokens: 19 tokens; generate speed: 12.601086082205825 tokens/s +2024-07-30 13:46:16,745 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:16,745 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[34/2067], cost time 1.5188s, every example cost time is 1.5188, generate speed: 12.5102 tokens/s, avg speed: 10.1736 tokens/s, remaining time: 0:44:45 +pred is: + ['ESPN Deportes'] + label is: + ['ESPN Deportes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:16,833 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:16,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 131, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:16,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:16,834 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:16,834 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:17,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:17,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:18,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1677100658416748 s; generated tokens: 8 tokens; generate speed: 6.851015705027491 tokens/s +2024-07-30 13:46:18,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:18,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[35/2067], cost time 1.1789s, every example cost time is 1.1789, generate speed: 6.7862 tokens/s, avg speed: 10.0870 tokens/s, remaining time: 0:44:36 +pred is: + ['NFL Mobile'] + label is: + ['NFL Mobile'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:18,089 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:18,090 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 121, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:18,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:18,090 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:18,091 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:19,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,625 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5346128940582275 s; generated tokens: 20 tokens; generate speed: 13.032602604498345 tokens/s +2024-07-30 13:46:19,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:19,630 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[36/2067], cost time 1.5457s, every example cost time is 1.5457, generate speed: 12.9387 tokens/s, avg speed: 10.1795 tokens/s, remaining time: 0:44:47 +pred is: + ['1'] + label is: + ['The Late Show with Stephen Colbert'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:19,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:19,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:19,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:19,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:19,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:20,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:20,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:21,087 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3730363845825195 s; generated tokens: 14 tokens; generate speed: 10.196379467581837 tokens/s +2024-07-30 13:46:21,092 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:21,093 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[37/2067], cost time 1.3844s, every example cost time is 1.3844, generate speed: 10.1127 tokens/s, avg speed: 10.1776 tokens/s, remaining time: 0:44:49 +pred is: + ['$5,000,000'] + label is: + ['$5,000,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:21,175 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:21,175 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 100, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:21,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:21,176 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:21,176 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:22,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,707 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5306034088134766 s; generated tokens: 20 tokens; generate speed: 13.066742099773576 tokens/s +2024-07-30 13:46:22,711 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:22,712 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[38/2067], cost time 1.5418s, every example cost time is 1.5418, generate speed: 12.9722 tokens/s, avg speed: 10.2628 tokens/s, remaining time: 0:45:00 +pred is: + ['Small Business Big Game'] + label is: + ['"Small Business Big Game"'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 13:46:22,793 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:22,794 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:22,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:22,794 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:22,795 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:23,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:23,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:24,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:24,343 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5477488040924072 s; generated tokens: 20 tokens; generate speed: 12.921993508971184 tokens/s +2024-07-30 13:46:24,347 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:24,348 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[39/2067], cost time 1.5590s, every example cost time is 1.5590, generate speed: 12.8284 tokens/s, avg speed: 10.3395 tokens/s, remaining time: 0:45:10 +pred is: + ['The Secret Life of Pets'] + label is: + ['Jason Bourne'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 13:46:24,430 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:24,430 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 103, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:24,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:24,431 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:24,431 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:25,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,868 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.436220407485962 s; generated tokens: 17 tokens; generate speed: 11.836623342344593 tokens/s +2024-07-30 13:46:25,872 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:25,873 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[40/2067], cost time 1.4474s, every example cost time is 1.4474, generate speed: 11.7449 tokens/s, avg speed: 10.3775 tokens/s, remaining time: 0:45:15 +pred is: + ['Westwood One'] + label is: + ['Westwood One'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 73.08035714285714, Em score: 67.5, current_count: 40 +2024-07-30 13:46:25,963 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:25,963 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:25,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:25,964 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:25,964 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:26,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:26,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:26,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:27,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:27,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.065061330795288 s; generated tokens: 4 tokens; generate speed: 3.7556522655959865 tokens/s +2024-07-30 13:46:27,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:27,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[41/2067], cost time 1.0762s, every example cost time is 1.0762, generate speed: 3.7168 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:45:00 +pred is: + ['KRFX'] + label is: + ['KRFX'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:27,117 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:27,117 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 95, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:27,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:27,118 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:27,118 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:28,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,647 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5284852981567383 s; generated tokens: 20 tokens; generate speed: 13.084849441547657 tokens/s +2024-07-30 13:46:28,651 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:28,651 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[42/2067], cost time 1.5396s, every example cost time is 1.5396, generate speed: 12.9907 tokens/s, avg speed: 10.3215 tokens/s, remaining time: 0:45:09 +pred is: + ['BBC Radio 5 Live'] + label is: + ['BBC Radio 5'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:46:28,734 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:28,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:28,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:28,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:28,735 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:29,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:29,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:30,293 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5581939220428467 s; generated tokens: 20 tokens; generate speed: 12.835372874371954 tokens/s +2024-07-30 13:46:30,298 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:30,298 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[43/2067], cost time 1.5694s, every example cost time is 1.5694, generate speed: 12.7440 tokens/s, avg speed: 10.3873 tokens/s, remaining time: 0:45:18 +pred is: + ['Bart Starr'] + label is: + ['Bart Starr'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:30,381 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:30,382 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 80, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:30,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:30,382 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:30,382 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:31,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:31,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.563317060470581 s; generated tokens: 19 tokens; generate speed: 12.153644631934565 tokens/s +2024-07-30 13:46:31,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:31,951 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[44/2067], cost time 1.5745s, every example cost time is 1.5745, generate speed: 12.0676 tokens/s, avg speed: 10.4319 tokens/s, remaining time: 0:45:28 +pred is: + ['Six'] + label is: + ['Six'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:32,033 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:32,033 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:32,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:32,034 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:32,034 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:32,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,565 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310125350952148 s; generated tokens: 20 tokens; generate speed: 13.063250327180493 tokens/s +2024-07-30 13:46:33,570 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:33,570 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[45/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9682 tokens/s, avg speed: 10.4962 tokens/s, remaining time: 0:45:35 +pred is: + ['December 3, 2015'] + label is: + ['December 3'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 13:46:33,652 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:33,652 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:33,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:33,653 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:33,653 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:34,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:34,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:35,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3489713668823242 s; generated tokens: 14 tokens; generate speed: 10.378278104120257 tokens/s +2024-07-30 13:46:35,007 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:35,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[46/2067], cost time 1.3600s, every example cost time is 1.3600, generate speed: 10.2943 tokens/s, avg speed: 10.4918 tokens/s, remaining time: 0:45:34 +pred is: + ['Carolina Panthers'] + label is: + ['Denver'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:35,089 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:35,089 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:35,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:35,090 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:35,090 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:36,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.195338249206543 s; generated tokens: 9 tokens; generate speed: 7.5292495709679965 tokens/s +2024-07-30 13:46:36,290 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:36,291 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[47/2067], cost time 1.2064s, every example cost time is 1.2064, generate speed: 7.4601 tokens/s, avg speed: 10.4341 tokens/s, remaining time: 0:45:26 +pred is: + ['Mike Carey'] + label is: + ['Mike Carey'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:36,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:36,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:36,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:36,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:36,374 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:37,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,571 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1960604190826416 s; generated tokens: 9 tokens; generate speed: 7.524703481871635 tokens/s +2024-07-30 13:46:37,575 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:37,575 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[48/2067], cost time 1.2072s, every example cost time is 1.2072, generate speed: 7.4553 tokens/s, avg speed: 10.3785 tokens/s, remaining time: 0:45:19 +pred is: + ['Jonathan Stewart'] + label is: + ['Jonathan Stewart'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:37,658 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:37,658 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:37,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:37,659 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:37,659 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:38,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:38,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:39,195 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5360281467437744 s; generated tokens: 20 tokens; generate speed: 13.02059473480222 tokens/s +2024-07-30 13:46:39,200 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:39,200 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[49/2067], cost time 1.5473s, every example cost time is 1.5473, generate speed: 12.9260 tokens/s, avg speed: 10.4380 tokens/s, remaining time: 0:45:26 +pred is: + ['Darian Stewart'] + label is: + ['Darian Stewart'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:39,283 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:39,283 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:39,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:39,284 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:39,284 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:40,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,617 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3330984115600586 s; generated tokens: 13 tokens; generate speed: 9.75171816819341 tokens/s +2024-07-30 13:46:40,622 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:40,622 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[50/2067], cost time 1.3442s, every example cost time is 1.3442, generate speed: 9.6711 tokens/s, avg speed: 10.4228 tokens/s, remaining time: 0:45:24 +pred is: + ['Ted Ginn Jr.'] + label is: + ['Ted Ginn Jr.'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 75.46428571428571, Em score: 68.0, current_count: 50 +2024-07-30 13:46:40,715 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:40,716 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:40,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:40,716 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:40,716 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:41,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:41,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:41,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:41,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:41,765 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0486233234405518 s; generated tokens: 4 tokens; generate speed: 3.8145251117206977 tokens/s +2024-07-30 13:46:41,770 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:41,770 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[51/2067], cost time 1.0598s, every example cost time is 1.0598, generate speed: 3.7744 tokens/s, avg speed: 10.3201 tokens/s, remaining time: 0:45:11 +pred is: + ['Ealy'] + label is: + ['Ealy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:41,852 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:41,852 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:41,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:41,853 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:41,853 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:42,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:42,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:43,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:43,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:43,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:43,331 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.478447675704956 s; generated tokens: 18 tokens; generate speed: 12.174932055960118 tokens/s +2024-07-30 13:46:43,336 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:43,336 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[52/2067], cost time 1.4895s, every example cost time is 1.4895, generate speed: 12.0844 tokens/s, avg speed: 10.3576 tokens/s, remaining time: 0:45:16 +pred is: + ['24'] + label is: + ['24'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:43,419 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:43,419 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 315, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:43,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:43,420 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:43,420 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:44,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,680 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.260134220123291 s; generated tokens: 11 tokens; generate speed: 8.729228858592352 tokens/s +2024-07-30 13:46:44,685 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:44,685 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[53/2067], cost time 1.2712s, every example cost time is 1.2712, generate speed: 8.6531 tokens/s, avg speed: 10.3272 tokens/s, remaining time: 0:45:11 +pred is: + ['2.5'] + label is: + ['five'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:44,767 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:44,767 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 357, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:44,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:44,768 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:44,768 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:45,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:45,965 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1971173286437988 s; generated tokens: 9 tokens; generate speed: 7.5180600803732425 tokens/s +2024-07-30 13:46:45,970 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:45,970 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[54/2067], cost time 1.2082s, every example cost time is 1.2082, generate speed: 7.4492 tokens/s, avg speed: 10.2793 tokens/s, remaining time: 0:45:05 +pred is: + ['194'] + label is: + ['194'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:46,051 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:46,051 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:46,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:46,052 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:46,052 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:46,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,123 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0707955360412598 s; generated tokens: 5 tokens; generate speed: 4.669425517484918 tokens/s +2024-07-30 13:46:47,128 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:47,128 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[55/2067], cost time 1.0818s, every example cost time is 1.0818, generate speed: 4.6217 tokens/s, avg speed: 10.1962 tokens/s, remaining time: 0:44:54 +pred is: + ['Nobel Prize'] + label is: + ['Nobel Prize'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:47,217 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:47,217 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 434, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:47,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:47,218 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:47,218 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:48,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5547373294830322 s; generated tokens: 20 tokens; generate speed: 12.8639093052781 tokens/s +2024-07-30 13:46:48,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:48,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[56/2067], cost time 1.5661s, every example cost time is 1.5661, generate speed: 12.7707 tokens/s, avg speed: 10.2498 tokens/s, remaining time: 0:45:01 +pred is: + ['100'] + label is: + ['100'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:48,866 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:48,867 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:48,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:48,867 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:48,868 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:49,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:49,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:49,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:49,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:49,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:49,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,421 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5526502132415771 s; generated tokens: 20 tokens; generate speed: 12.881201335260561 tokens/s +2024-07-30 13:46:50,425 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:50,425 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[57/2067], cost time 1.5640s, every example cost time is 1.5640, generate speed: 12.7875 tokens/s, avg speed: 10.3015 tokens/s, remaining time: 0:45:07 +pred is: + ['15 kilometres (9 miles)'] + label is: + ['15 kilometres'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:46:50,514 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:50,515 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:50,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:50,516 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:50,516 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:51,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:51,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:52,053 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536836862564087 s; generated tokens: 20 tokens; generate speed: 13.013743024507905 tokens/s +2024-07-30 13:46:52,057 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:52,058 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[58/2067], cost time 1.5483s, every example cost time is 1.5483, generate speed: 12.9173 tokens/s, avg speed: 10.3532 tokens/s, remaining time: 0:45:13 +pred is: + ['Demographically'] + label is: + ['city'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:52,155 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:52,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:52,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:52,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:52,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:53,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,444 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.28721022605896 s; generated tokens: 12 tokens; generate speed: 9.322486534884277 tokens/s +2024-07-30 13:46:53,449 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:53,449 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[59/2067], cost time 1.2990s, every example cost time is 1.2990, generate speed: 9.2376 tokens/s, avg speed: 10.3350 tokens/s, remaining time: 0:45:10 +pred is: + ['Warsaw University of Technology'] + label is: + ['Warsaw University of Technology'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:53,531 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:53,532 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:53,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:53,532 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:53,533 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:54,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:54,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:55,070 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372262001037598 s; generated tokens: 20 tokens; generate speed: 13.010446997748307 tokens/s +2024-07-30 13:46:55,075 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:55,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[60/2067], cost time 1.5490s, every example cost time is 1.5490, generate speed: 12.9118 tokens/s, avg speed: 10.3842 tokens/s, remaining time: 0:45:15 +pred is: + ['1816'] + label is: + ['1816'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 75.38690476190476, Em score: 68.33333333333333, current_count: 60 +2024-07-30 13:46:55,170 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:55,171 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:55,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:55,171 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:55,172 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:56,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,703 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5314075946807861 s; generated tokens: 20 tokens; generate speed: 13.05988038029085 tokens/s +2024-07-30 13:46:56,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:56,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[61/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9612 tokens/s, avg speed: 10.4322 tokens/s, remaining time: 0:45:20 +pred is: + ['Infrastructure'] + label is: + ['infrastructure'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:56,790 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:56,790 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:56,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:56,791 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:56,791 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:57,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:57,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:58,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:58,327 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5360846519470215 s; generated tokens: 20 tokens; generate speed: 13.02011576943338 tokens/s +2024-07-30 13:46:58,332 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:58,333 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[62/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9227 tokens/s, avg speed: 10.4780 tokens/s, remaining time: 0:45:25 +pred is: + ['Warsaw'] + label is: + ['Warsaw'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:46:58,414 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:58,415 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:58,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:58,415 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:58,416 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:46:59,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:59,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:59,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:59,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:59,500 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.084397315979004 s; generated tokens: 4 tokens; generate speed: 3.6886848953409324 tokens/s +2024-07-30 13:46:59,505 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:46:59,505 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[63/2067], cost time 1.0957s, every example cost time is 1.0957, generate speed: 3.6507 tokens/s, avg speed: 10.3903 tokens/s, remaining time: 0:45:15 +pred is: + ['Music theatre'] + label is: + ['musical'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:46:59,587 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:46:59,588 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:46:59,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:46:59,588 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:46:59,589 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:00,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:00,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:01,143 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5547566413879395 s; generated tokens: 20 tokens; generate speed: 12.863749520404617 tokens/s +2024-07-30 13:47:01,148 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:01,149 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[64/2067], cost time 1.5660s, every example cost time is 1.5660, generate speed: 12.7714 tokens/s, avg speed: 10.4332 tokens/s, remaining time: 0:45:20 +pred is: + ['Ogród Saski'] + label is: + ['Ogród Saski'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:01,231 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:01,231 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:01,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:01,232 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:01,232 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:02,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,303 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0705268383026123 s; generated tokens: 5 tokens; generate speed: 4.670597523671443 tokens/s +2024-07-30 13:47:02,307 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:02,308 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[65/2067], cost time 1.0816s, every example cost time is 1.0816, generate speed: 4.6229 tokens/s, avg speed: 10.3618 tokens/s, remaining time: 0:45:10 +pred is: + ['Wianki'] + label is: + ['Wianki'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:02,389 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:02,389 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:02,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:02,390 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:02,390 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:03,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:03,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5791864395141602 s; generated tokens: 20 tokens; generate speed: 12.66474907557656 tokens/s +2024-07-30 13:47:03,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:03,975 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[66/2067], cost time 1.5904s, every example cost time is 1.5904, generate speed: 12.5751 tokens/s, avg speed: 10.4011 tokens/s, remaining time: 0:45:16 +pred is: + ['Art posters'] + label is: + ['art posters'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:04,057 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:04,057 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:04,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:04,058 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:04,058 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:05,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,189 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1302528381347656 s; generated tokens: 7 tokens; generate speed: 6.1933045101235615 tokens/s +2024-07-30 13:47:05,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:05,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[67/2067], cost time 1.1414s, every example cost time is 1.1414, generate speed: 6.1330 tokens/s, avg speed: 10.3474 tokens/s, remaining time: 0:45:08 +pred is: + ['Warsaw Uprising Museum'] + label is: + ['Warsaw Uprising Museum'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:05,275 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:05,275 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:05,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:05,276 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:05,276 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:06,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,804 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5275630950927734 s; generated tokens: 20 tokens; generate speed: 13.092748878425438 tokens/s +2024-07-30 13:47:06,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:06,809 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[68/2067], cost time 1.5387s, every example cost time is 1.5387, generate speed: 12.9979 tokens/s, avg speed: 10.3916 tokens/s, remaining time: 0:45:12 +pred is: + ['Ujazdów Castle'] + label is: + ['Royal Ujazdów Castle'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:47:06,891 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:06,891 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:06,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:06,892 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:06,892 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:07,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:07,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:07,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:07,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:07,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:07,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,440 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5483460426330566 s; generated tokens: 20 tokens; generate speed: 12.917009149962874 tokens/s +2024-07-30 13:47:08,445 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:08,445 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[69/2067], cost time 1.5596s, every example cost time is 1.5596, generate speed: 12.8241 tokens/s, avg speed: 10.4320 tokens/s, remaining time: 0:45:17 +pred is: + ['Polonia Warsaw'] + label is: + ['Polonia Warsaw'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:08,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:08,529 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:08,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:08,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:08,529 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:09,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:09,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:09,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:09,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:09,571 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0414884090423584 s; generated tokens: 4 tokens; generate speed: 3.840657241378205 tokens/s +2024-07-30 13:47:09,576 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:09,576 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[70/2067], cost time 1.0528s, every example cost time is 1.0528, generate speed: 3.7996 tokens/s, avg speed: 10.3585 tokens/s, remaining time: 0:45:07 +pred is: + ['syrenka'] + label is: + ['syrenka'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 77.23639455782313, Em score: 70.0, current_count: 70 +2024-07-30 13:47:09,672 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:09,672 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:09,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:09,673 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:09,673 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:10,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:10,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:11,234 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5604753494262695 s; generated tokens: 20 tokens; generate speed: 12.816607457050365 tokens/s +2024-07-30 13:47:11,239 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:11,239 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[71/2067], cost time 1.5716s, every example cost time is 1.5716, generate speed: 12.7256 tokens/s, avg speed: 10.3970 tokens/s, remaining time: 0:45:12 +pred is: + ['A legend'] + label is: + ['legend'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:47:11,321 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:11,321 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:11,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:11,322 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:11,322 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:12,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,874 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5511925220489502 s; generated tokens: 20 tokens; generate speed: 12.893306095611045 tokens/s +2024-07-30 13:47:12,878 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:12,879 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[72/2067], cost time 1.5623s, every example cost time is 1.5623, generate speed: 12.8016 tokens/s, avg speed: 10.4353 tokens/s, remaining time: 0:45:16 +pred is: + ['1'] + label is: + ['Warsaw'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:12,961 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:12,961 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:12,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:12,962 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:12,962 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:13,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:13,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:13,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,518 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5555534362792969 s; generated tokens: 20 tokens; generate speed: 12.857160373633757 tokens/s +2024-07-30 13:47:14,523 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:14,523 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[73/2067], cost time 1.5668s, every example cost time is 1.5668, generate speed: 12.7651 tokens/s, avg speed: 10.4720 tokens/s, remaining time: 0:45:20 +pred is: + ['Economist Intelligence Unit'] + label is: + ['Economist Intelligence Unit'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:14,605 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:14,605 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 394, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:14,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:14,606 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:14,606 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:15,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:15,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:15,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:15,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:15,650 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0431628227233887 s; generated tokens: 4 tokens; generate speed: 3.834492480816357 tokens/s +2024-07-30 13:47:15,654 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:15,655 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[74/2067], cost time 1.0541s, every example cost time is 1.0541, generate speed: 3.7947 tokens/s, avg speed: 10.4021 tokens/s, remaining time: 0:45:10 +pred is: + ['1313'] + label is: + ['1313'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:15,736 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:15,737 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:15,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:15,737 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:15,737 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:16,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:16,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:17,291 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5534133911132812 s; generated tokens: 20 tokens; generate speed: 12.874872918191238 tokens/s +2024-07-30 13:47:17,296 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:17,296 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[75/2067], cost time 1.5645s, every example cost time is 1.5645, generate speed: 12.7836 tokens/s, avg speed: 10.4385 tokens/s, remaining time: 0:45:14 +pred is: + ['Roman Catholic'] + label is: + ['Roman Catholic'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:17,408 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:17,408 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 285, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:17,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:17,409 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:17,409 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:18,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,666 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.257000207901001 s; generated tokens: 11 tokens; generate speed: 8.750992983818456 tokens/s +2024-07-30 13:47:18,671 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:18,671 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[76/2067], cost time 1.2687s, every example cost time is 1.2687, generate speed: 8.6705 tokens/s, avg speed: 10.4168 tokens/s, remaining time: 0:45:11 +pred is: + ['Warszawa'] + label is: + ['Warszawa'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:18,753 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:18,753 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:18,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:18,754 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:18,754 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:19,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:19,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:20,285 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308656692504883 s; generated tokens: 20 tokens; generate speed: 13.06450356927267 tokens/s +2024-07-30 13:47:20,290 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:20,290 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[77/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9702 tokens/s, avg speed: 10.4543 tokens/s, remaining time: 0:45:14 +pred is: + ['Jazdów'] + label is: + ['Jazdów'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:20,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:20,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:20,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:20,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:20,374 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:21,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,908 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342473983764648 s; generated tokens: 20 tokens; generate speed: 13.035707292815962 tokens/s +2024-07-30 13:47:21,913 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:21,913 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[78/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9403 tokens/s, avg speed: 10.4904 tokens/s, remaining time: 0:45:17 +pred is: + ['The General Sejm'] + label is: + ['General Sejm'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:47:21,995 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:21,996 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:21,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:21,997 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:21,997 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:22,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:22,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,552 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5550973415374756 s; generated tokens: 20 tokens; generate speed: 12.86093125220485 tokens/s +2024-07-30 13:47:23,557 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:23,557 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[79/2067], cost time 1.5665s, every example cost time is 1.5665, generate speed: 12.7670 tokens/s, avg speed: 10.5234 tokens/s, remaining time: 0:45:21 +pred is: + ['179 years'] + label is: + ['until 1796'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 13:47:23,639 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:23,639 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:23,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:23,640 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:23,640 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:24,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1331753730773926 s; generated tokens: 7 tokens; generate speed: 6.177331564301407 tokens/s +2024-07-30 13:47:24,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:24,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[80/2067], cost time 1.1444s, every example cost time is 1.1444, generate speed: 6.1170 tokens/s, avg speed: 10.4772 tokens/s, remaining time: 0:45:14 +pred is: + ['1915-1918'] + label is: + ['from 4 August 1915 until November 1918'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 75.8110119047619, Em score: 67.5, current_count: 80 +2024-07-30 13:47:24,877 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:24,877 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:24,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:24,878 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:24,878 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:25,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:25,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:25,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:25,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:25,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:25,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,413 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342402458190918 s; generated tokens: 20 tokens; generate speed: 13.035768064683056 tokens/s +2024-07-30 13:47:26,425 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:26,425 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[81/2067], cost time 1.5531s, every example cost time is 1.5531, generate speed: 12.8771 tokens/s, avg speed: 10.5109 tokens/s, remaining time: 0:45:17 +pred is: + ['1 September 1939'] + label is: + ['September 1939'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:47:26,508 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:26,508 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:26,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:26,509 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:26,509 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:27,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:27,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:28,052 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5430755615234375 s; generated tokens: 20 tokens; generate speed: 12.961128086465534 tokens/s +2024-07-30 13:47:28,057 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:28,057 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[82/2067], cost time 1.5546s, every example cost time is 1.5546, generate speed: 12.8653 tokens/s, avg speed: 10.5434 tokens/s, remaining time: 0:45:20 +pred is: + ['Red Army'] + label is: + ['the Red Army'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:47:28,139 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:28,140 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:28,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:28,140 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:28,140 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:29,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,335 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1946566104888916 s; generated tokens: 9 tokens; generate speed: 7.533545556925277 tokens/s +2024-07-30 13:47:29,340 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:29,340 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[83/2067], cost time 1.2059s, every example cost time is 1.2059, generate speed: 7.4633 tokens/s, avg speed: 10.5107 tokens/s, remaining time: 0:45:15 +pred is: + ['"Bricks for Warsaw" campaign'] + label is: + ['"Bricks for Warsaw"'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 13:47:29,438 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:29,438 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:29,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:29,439 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:29,439 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:30,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:30,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:30,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:30,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:30,481 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0416898727416992 s; generated tokens: 4 tokens; generate speed: 3.8399144550307565 tokens/s +2024-07-30 13:47:30,486 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:30,486 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[84/2067], cost time 1.0534s, every example cost time is 1.0534, generate speed: 3.7971 tokens/s, avg speed: 10.4490 tokens/s, remaining time: 0:45:06 +pred is: + ['John Paul II'] + label is: + ['John Paul II'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:30,568 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:30,568 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 307, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:30,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:30,569 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:30,569 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:31,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:31,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:32,111 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541196584701538 s; generated tokens: 20 tokens; generate speed: 12.97692987288388 tokens/s +2024-07-30 13:47:32,116 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:32,116 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[85/2067], cost time 1.5527s, every example cost time is 1.5527, generate speed: 12.8804 tokens/s, avg speed: 10.4815 tokens/s, remaining time: 0:45:09 +pred is: + ['300'] + label is: + ['about 300'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:47:32,198 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:32,198 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:32,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:32,199 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:32,199 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:33,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:33,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:33,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:33,210 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011084794998169 s; generated tokens: 3 tokens; generate speed: 2.9671101917870626 tokens/s +2024-07-30 13:47:33,215 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:33,215 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[86/2067], cost time 1.0225s, every example cost time is 1.0225, generate speed: 2.9341 tokens/s, avg speed: 10.4157 tokens/s, remaining time: 0:45:00 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:33,297 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:33,297 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:33,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:33,298 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:33,298 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:34,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,434 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1355960369110107 s; generated tokens: 7 tokens; generate speed: 6.164163815718339 tokens/s +2024-07-30 13:47:34,438 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:34,439 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[87/2067], cost time 1.1466s, every example cost time is 1.1466, generate speed: 6.1048 tokens/s, avg speed: 10.3739 tokens/s, remaining time: 0:44:54 +pred is: + ['The plain moraine plateau'] + label is: + ['moraine'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:47:34,520 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:34,520 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:34,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:34,521 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:34,521 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:35,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:35,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:36,054 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5329062938690186 s; generated tokens: 20 tokens; generate speed: 13.04711193371154 tokens/s +2024-07-30 13:47:36,059 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:36,060 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[88/2067], cost time 1.5443s, every example cost time is 1.5443, generate speed: 12.9508 tokens/s, avg speed: 10.4071 tokens/s, remaining time: 0:44:56 +pred is: + ['1'] + label is: + ['turbulent history of the city'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:36,144 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:36,145 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:36,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:36,145 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:36,145 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:37,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,288 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1423683166503906 s; generated tokens: 6 tokens; generate speed: 5.252246506269514 tokens/s +2024-07-30 13:47:37,293 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:37,293 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[89/2067], cost time 1.1538s, every example cost time is 1.1538, generate speed: 5.2004 tokens/s, avg speed: 10.3575 tokens/s, remaining time: 0:44:50 +pred is: + ['Gothic architecture'] + label is: + ['Gothic'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:47:37,374 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:37,375 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:37,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:37,375 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:37,376 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:38,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,526 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1505510807037354 s; generated tokens: 5 tokens; generate speed: 4.345743603962152 tokens/s +2024-07-30 13:47:38,531 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:38,531 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[90/2067], cost time 1.1617s, every example cost time is 1.1617, generate speed: 4.3039 tokens/s, avg speed: 10.3000 tokens/s, remaining time: 0:44:45 +pred is: + ['17th century'] + label is: + ['17th century'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 73.63756613756614, Em score: 62.22222222222222, current_count: 90 +2024-07-30 13:47:38,632 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:38,633 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:38,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:38,633 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:38,634 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:39,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:39,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:39,618 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9838385581970215 s; generated tokens: 2 tokens; generate speed: 2.032853849177442 tokens/s +2024-07-30 13:47:39,622 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:39,622 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[91/2067], cost time 0.9949s, every example cost time is 0.9949, generate speed: 2.0103 tokens/s, avg speed: 10.2330 tokens/s, remaining time: 0:44:35 +pred is: + ['A'] + label is: + ['bourgeois'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:39,705 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:39,705 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:39,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:39,706 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:39,706 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:40,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:40,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:41,085 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.379180908203125 s; generated tokens: 15 tokens; generate speed: 10.876020622662802 tokens/s +2024-07-30 13:47:41,090 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:41,090 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[92/2067], cost time 1.3902s, every example cost time is 1.3902, generate speed: 10.7899 tokens/s, avg speed: 10.2393 tokens/s, remaining time: 0:44:35 +pred is: + ['There are also many places commemorating the heroic history of Warsaw.'] + label is: + ['many places'] +The F1/Em of this example is: {'F1': 24.000000000000004, 'Em': 0.0} +2024-07-30 13:47:41,172 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:41,172 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:41,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:41,173 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:41,173 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:42,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,248 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0746924877166748 s; generated tokens: 5 tokens; generate speed: 4.652493673444351 tokens/s +2024-07-30 13:47:42,252 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:42,253 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[93/2067], cost time 1.0857s, every example cost time is 1.0857, generate speed: 4.6052 tokens/s, avg speed: 10.1906 tokens/s, remaining time: 0:44:28 +pred is: + ['Botanical garden'] + label is: + ['green'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:42,334 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:42,334 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:42,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:42,335 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:42,335 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:43,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,889 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5535824298858643 s; generated tokens: 20 tokens; generate speed: 12.873472057397896 tokens/s +2024-07-30 13:47:43,894 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:43,894 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[94/2067], cost time 1.5647s, every example cost time is 1.5647, generate speed: 12.7817 tokens/s, avg speed: 10.2225 tokens/s, remaining time: 0:44:31 +pred is: + ['1'] + label is: + ['location of Warsaw'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:43,977 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:43,977 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:43,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:43,977 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:43,978 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:44,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:44,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:44,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,514 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5357334613800049 s; generated tokens: 20 tokens; generate speed: 13.02309320136065 tokens/s +2024-07-30 13:47:45,518 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:45,519 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[95/2067], cost time 1.5468s, every example cost time is 1.5468, generate speed: 12.9295 tokens/s, avg speed: 10.2550 tokens/s, remaining time: 0:44:33 +pred is: + ['1,300,000'] + label is: + ['1,300,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:45,600 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:45,601 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:45,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:45,601 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:45,601 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:46,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:46,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:46,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:46,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:46,642 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0407202243804932 s; generated tokens: 4 tokens; generate speed: 3.843492137746309 tokens/s +2024-07-30 13:47:46,647 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:46,647 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[96/2067], cost time 1.0517s, every example cost time is 1.0517, generate speed: 3.8034 tokens/s, avg speed: 10.2027 tokens/s, remaining time: 0:44:26 +pred is: + ['Multi-cultural'] + label is: + ['multi-cultural'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:46,729 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:46,729 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 326, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:46,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:46,730 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:46,730 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:47,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:47,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:48,292 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.561784267425537 s; generated tokens: 20 tokens; generate speed: 12.805865968267325 tokens/s +2024-07-30 13:47:48,297 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:48,297 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[97/2067], cost time 1.5729s, every example cost time is 1.5729, generate speed: 12.7153 tokens/s, avg speed: 10.2328 tokens/s, remaining time: 0:44:29 +pred is: + ['commune'] + label is: + ['a commune'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:47:48,379 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:48,380 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:48,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:48,380 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:48,381 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:49,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:49,928 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5471231937408447 s; generated tokens: 20 tokens; generate speed: 12.927218776703413 tokens/s +2024-07-30 13:47:49,933 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:49,933 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[98/2067], cost time 1.5583s, every example cost time is 1.5583, generate speed: 12.8342 tokens/s, avg speed: 10.2633 tokens/s, remaining time: 0:44:32 +pred is: + ['1'] + label is: + ['Warsaw City Council'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:47:50,039 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:50,039 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:50,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:50,040 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:50,040 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:50,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:51,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:51,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:51,050 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0094914436340332 s; generated tokens: 3 tokens; generate speed: 2.971793390541681 tokens/s +2024-07-30 13:47:51,055 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:51,055 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[99/2067], cost time 1.0210s, every example cost time is 1.0210, generate speed: 2.9384 tokens/s, avg speed: 10.2075 tokens/s, remaining time: 0:44:24 +pred is: + ['President'] + label is: + ['President'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:51,137 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:51,137 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 351, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:51,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:51,138 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:51,138 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:52,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,699 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5613317489624023 s; generated tokens: 20 tokens; generate speed: 12.809577473391666 tokens/s +2024-07-30 13:47:52,704 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:52,704 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[100/2067], cost time 1.5725s, every example cost time is 1.5725, generate speed: 12.7185 tokens/s, avg speed: 10.2366 tokens/s, remaining time: 0:44:27 +pred is: + ['Śródmieście'] + label is: + ['Śródmieście'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 71.01380952380951, Em score: 60.0, current_count: 100 +2024-07-30 13:47:52,841 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:52,842 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:52,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:52,842 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:52,843 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:53,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:53,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:54,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:54,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:54,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:54,343 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.499891757965088 s; generated tokens: 19 tokens; generate speed: 12.66758077648044 tokens/s +2024-07-30 13:47:54,347 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:54,348 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[101/2067], cost time 1.5116s, every example cost time is 1.5116, generate speed: 12.5692 tokens/s, avg speed: 10.2623 tokens/s, remaining time: 0:44:28 +pred is: + ['1817'] + label is: + ['1817'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:54,430 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:54,430 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:54,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:54,431 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:54,431 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:55,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:55,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:55,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:55,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:55,470 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0385780334472656 s; generated tokens: 4 tokens; generate speed: 3.851419798205372 tokens/s +2024-07-30 13:47:55,475 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:55,475 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[102/2067], cost time 1.0496s, every example cost time is 1.0496, generate speed: 3.8109 tokens/s, avg speed: 10.2133 tokens/s, remaining time: 0:44:21 +pred is: + ['1951'] + label is: + ['1951'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:55,556 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:55,556 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:55,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:55,557 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:55,557 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:56,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:56,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:57,090 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5321271419525146 s; generated tokens: 19 tokens; generate speed: 12.401059598609258 tokens/s +2024-07-30 13:47:57,094 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:57,095 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[103/2067], cost time 1.5434s, every example cost time is 1.5434, generate speed: 12.3106 tokens/s, avg speed: 10.2365 tokens/s, remaining time: 0:44:23 +pred is: + ['Warszawa'] + label is: + ['Warszawa'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:57,177 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:57,177 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:57,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:57,178 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:57,178 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:58,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,717 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539494276046753 s; generated tokens: 20 tokens; generate speed: 12.991279221484172 tokens/s +2024-07-30 13:47:58,722 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:58,723 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[104/2067], cost time 1.5508s, every example cost time is 1.5508, generate speed: 12.8967 tokens/s, avg speed: 10.2657 tokens/s, remaining time: 0:44:26 +pred is: + ['France'] + label is: + ['France'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:47:58,805 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:47:58,805 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 336, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:47:58,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:58,806 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:47:58,806 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:47:59,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:47:59,950 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1437649726867676 s; generated tokens: 7 tokens; generate speed: 6.120138461275493 tokens/s +2024-07-30 13:47:59,954 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:47:59,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[105/2067], cost time 1.1549s, every example cost time is 1.1549, generate speed: 6.0612 tokens/s, avg speed: 10.2316 tokens/s, remaining time: 0:44:20 +pred is: + ['William the Conqueror'] + label is: + ['William the Conqueror'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:00,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:00,037 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:00,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:00,038 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:00,038 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:00,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,168 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.129760503768921 s; generated tokens: 7 tokens; generate speed: 6.196003468565022 tokens/s +2024-07-30 13:48:01,172 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:01,173 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[106/2067], cost time 1.1409s, every example cost time is 1.1409, generate speed: 6.1354 tokens/s, avg speed: 10.1990 tokens/s, remaining time: 0:44:15 +pred is: + ['Norseman, Viking'] + label is: + ['Viking'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 13:48:01,261 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:01,261 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:01,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:01,262 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:01,262 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:02,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,775 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5127642154693604 s; generated tokens: 19 tokens; generate speed: 12.559789427663672 tokens/s +2024-07-30 13:48:02,780 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:02,780 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[107/2067], cost time 1.5244s, every example cost time is 1.5244, generate speed: 12.4640 tokens/s, avg speed: 10.2228 tokens/s, remaining time: 0:44:17 +pred is: + ['911'] + label is: + ['911'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:02,869 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:02,870 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:02,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:02,870 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:02,871 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:03,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:03,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:03,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:03,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:03,910 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0394678115844727 s; generated tokens: 4 tokens; generate speed: 3.848123006236003 tokens/s +2024-07-30 13:48:03,915 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:03,915 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[108/2067], cost time 1.0511s, every example cost time is 1.0511, generate speed: 3.8055 tokens/s, avg speed: 10.1766 tokens/s, remaining time: 0:44:10 +pred is: + ['Rollo'] + label is: + ['Rollo'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:04,007 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:04,007 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:04,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:04,008 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:04,008 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:04,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:04,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,416 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4071097373962402 s; generated tokens: 16 tokens; generate speed: 11.370826009353683 tokens/s +2024-07-30 13:48:05,421 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:05,421 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[109/2067], cost time 1.4188s, every example cost time is 1.4188, generate speed: 11.2772 tokens/s, avg speed: 10.1872 tokens/s, remaining time: 0:44:10 +pred is: + ['Catholicism'] + label is: + ['Catholicism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:05,503 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:05,503 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:05,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:05,504 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:05,504 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:06,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,607 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1024839878082275 s; generated tokens: 6 tokens; generate speed: 5.442255911515039 tokens/s +2024-07-30 13:48:06,611 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:06,612 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[110/2067], cost time 1.1136s, every example cost time is 1.1136, generate speed: 5.3877 tokens/s, avg speed: 10.1513 tokens/s, remaining time: 0:44:04 +pred is: + ['Fighting horsemen'] + label is: + ['fighting horsemen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 73.1034632034632, Em score: 62.72727272727273, current_count: 110 +2024-07-30 13:48:06,716 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:06,716 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:06,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:06,717 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:06,717 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:07,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:07,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:08,080 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3631422519683838 s; generated tokens: 14 tokens; generate speed: 10.270388126979363 tokens/s +2024-07-30 13:48:08,085 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:08,085 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[111/2067], cost time 1.3744s, every example cost time is 1.3744, generate speed: 10.1865 tokens/s, avg speed: 10.1516 tokens/s, remaining time: 0:44:03 +pred is: + ['999'] + label is: + ['999'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:08,167 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:08,167 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:08,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:08,168 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:08,168 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:09,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,240 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0717649459838867 s; generated tokens: 5 tokens; generate speed: 4.665202028426084 tokens/s +2024-07-30 13:48:09,245 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:09,245 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[112/2067], cost time 1.0828s, every example cost time is 1.0828, generate speed: 4.6176 tokens/s, avg speed: 10.1119 tokens/s, remaining time: 0:43:57 +pred is: + ['Drogo'] + label is: + ['Drogo'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:09,327 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:09,327 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:09,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:09,328 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:09,328 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:10,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,879 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5509593486785889 s; generated tokens: 20 tokens; generate speed: 12.895244493055166 tokens/s +2024-07-30 13:48:10,886 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:10,886 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[113/2067], cost time 1.5643s, every example cost time is 1.5643, generate speed: 12.7852 tokens/s, avg speed: 10.1393 tokens/s, remaining time: 0:44:00 +pred is: + ['Saracens'] + label is: + ['Saracens'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:10,971 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:10,972 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:10,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:10,972 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:10,973 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:11,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:11,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:11,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:12,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:12,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:12,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:12,077 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.104405403137207 s; generated tokens: 6 tokens; generate speed: 5.432787618528685 tokens/s +2024-07-30 13:48:12,082 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:12,082 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[114/2067], cost time 1.1169s, every example cost time is 1.1169, generate speed: 5.3721 tokens/s, avg speed: 10.1047 tokens/s, remaining time: 0:43:54 +pred is: + ['The Book of Roger'] + label is: + ['Kitab Rudjdjar'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 13:48:12,165 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:12,165 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:12,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:12,166 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:12,166 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:13,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,701 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5351691246032715 s; generated tokens: 20 tokens; generate speed: 13.02788056343208 tokens/s +2024-07-30 13:48:13,707 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:13,707 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[115/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9309 tokens/s, avg speed: 10.1328 tokens/s, remaining time: 0:43:56 +pred is: + ['Seljuk Turks'] + label is: + ['Seljuk Turks'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:13,789 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:13,790 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:13,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:13,790 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:13,791 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:14,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,862 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071535587310791 s; generated tokens: 5 tokens; generate speed: 4.666200599597806 tokens/s +2024-07-30 13:48:14,867 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:14,867 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[116/2067], cost time 1.0829s, every example cost time is 1.0829, generate speed: 4.6174 tokens/s, avg speed: 10.0947 tokens/s, remaining time: 0:43:50 +pred is: + ['1050s'] + label is: + ['1050s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:14,952 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:14,952 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:14,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:14,953 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:14,953 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:15,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:15,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,118 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1647813320159912 s; generated tokens: 6 tokens; generate speed: 5.151181457909583 tokens/s +2024-07-30 13:48:16,123 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:16,123 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[117/2067], cost time 1.1763s, every example cost time is 1.1763, generate speed: 5.1008 tokens/s, avg speed: 10.0574 tokens/s, remaining time: 0:43:46 +pred is: + ['Afranji'] + label is: + ['Afranji'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:16,206 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:16,206 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:16,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:16,207 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:16,207 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:17,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,741 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5331223011016846 s; generated tokens: 20 tokens; generate speed: 13.045273678184854 tokens/s +2024-07-30 13:48:17,745 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:17,746 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[118/2067], cost time 1.5443s, every example cost time is 1.5443, generate speed: 12.9507 tokens/s, avg speed: 10.0855 tokens/s, remaining time: 0:43:48 +pred is: + ['Italo-Norman'] + label is: + ['Norman mercenary'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:48:17,827 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:17,828 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 435, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:17,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:17,828 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:17,828 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:18,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:18,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:19,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:19,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:19,362 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5334970951080322 s; generated tokens: 19 tokens; generate speed: 12.389981083506052 tokens/s +2024-07-30 13:48:19,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:19,367 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[119/2067], cost time 1.5447s, every example cost time is 1.5447, generate speed: 12.3003 tokens/s, avg speed: 10.1068 tokens/s, remaining time: 0:43:50 +pred is: + ['Robert Guiscard'] + label is: + ['Robert Guiscard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:19,449 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:19,449 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:19,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:19,450 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:19,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:20,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:20,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:21,010 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.559340476989746 s; generated tokens: 20 tokens; generate speed: 12.82593525604448 tokens/s +2024-07-30 13:48:21,015 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:21,015 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[120/2067], cost time 1.5705s, every example cost time is 1.5705, generate speed: 12.7351 tokens/s, avg speed: 10.1322 tokens/s, remaining time: 0:43:52 +pred is: + ['Deabolis'] + label is: + ['Deabolis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 73.84484126984127, Em score: 64.16666666666667, current_count: 120 +2024-07-30 13:48:21,123 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:21,123 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 119, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:21,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:21,124 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:21,124 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:22,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:22,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:22,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:22,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:22,185 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0609402656555176 s; generated tokens: 4 tokens; generate speed: 3.7702405399125283 tokens/s +2024-07-30 13:48:22,190 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:22,190 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[121/2067], cost time 1.0720s, every example cost time is 1.0720, generate speed: 3.7313 tokens/s, avg speed: 10.0902 tokens/s, remaining time: 0:43:46 +pred is: + ['1185'] + label is: + ['1185'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:22,272 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:22,272 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:22,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:22,273 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:22,273 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:23,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,466 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1928396224975586 s; generated tokens: 9 tokens; generate speed: 7.545020998846323 tokens/s +2024-07-30 13:48:23,471 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:23,471 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[122/2067], cost time 1.2039s, every example cost time is 1.2039, generate speed: 7.4760 tokens/s, avg speed: 10.0711 tokens/s, remaining time: 0:43:43 +pred is: + ['King Ethelred II of England'] + label is: + ['King Ethelred II'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 13:48:23,553 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:23,553 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:23,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:23,554 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:23,554 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:24,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:24,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:25,112 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5581700801849365 s; generated tokens: 20 tokens; generate speed: 12.83556927086306 tokens/s +2024-07-30 13:48:25,117 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:25,117 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[123/2067], cost time 1.5694s, every example cost time is 1.5694, generate speed: 12.7435 tokens/s, avg speed: 10.0963 tokens/s, remaining time: 0:43:45 +pred is: + ['Harthacnut'] + label is: + ['Harthacnut'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:25,199 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:25,200 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:25,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:25,200 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:25,200 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:26,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:26,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:26,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:26,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:26,240 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.039008617401123 s; generated tokens: 4 tokens; generate speed: 3.8498237002164797 tokens/s +2024-07-30 13:48:26,244 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:26,245 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[124/2067], cost time 1.0501s, every example cost time is 1.0501, generate speed: 3.8090 tokens/s, avg speed: 10.0568 tokens/s, remaining time: 0:43:39 +pred is: + ['Battle of Hastings'] + label is: + ['Battle of Hastings'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:26,327 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:26,327 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:26,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:26,328 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:26,328 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:27,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:27,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:27,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:27,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:27,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0413331985473633 s; generated tokens: 4 tokens; generate speed: 3.8412296905350867 tokens/s +2024-07-30 13:48:27,374 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:27,375 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[125/2067], cost time 1.0527s, every example cost time is 1.0527, generate speed: 3.7999 tokens/s, avg speed: 10.0177 tokens/s, remaining time: 0:43:33 +pred is: + ['Middle English'] + label is: + ['Modern English'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 13:48:27,481 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:27,481 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 341, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:27,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:27,482 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:27,482 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:28,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:28,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:28,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:28,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:28,525 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.042954683303833 s; generated tokens: 4 tokens; generate speed: 3.835257719279757 tokens/s +2024-07-30 13:48:28,530 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:28,530 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[126/2067], cost time 1.0783s, every example cost time is 1.0783, generate speed: 3.7096 tokens/s, avg speed: 9.9775 tokens/s, remaining time: 0:43:27 +pred is: + ['1169'] + label is: + ['1169'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:28,611 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:28,612 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:28,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:28,612 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:28,613 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:29,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:29,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:30,146 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.533475637435913 s; generated tokens: 20 tokens; generate speed: 13.042267846812036 tokens/s +2024-07-30 13:48:30,151 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:30,151 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[127/2067], cost time 1.5447s, every example cost time is 1.5447, generate speed: 12.9478 tokens/s, avg speed: 10.0043 tokens/s, remaining time: 0:43:29 +pred is: + ['Edgar Atheling'] + label is: + ['Edgar'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:48:30,256 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:30,256 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:30,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:30,257 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:30,257 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:31,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,820 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5622072219848633 s; generated tokens: 20 tokens; generate speed: 12.80239888699848 tokens/s +2024-07-30 13:48:31,824 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:31,825 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[128/2067], cost time 1.5739s, every example cost time is 1.5739, generate speed: 12.7071 tokens/s, avg speed: 10.0290 tokens/s, remaining time: 0:43:31 +pred is: + ['Sybilla of Normandy'] + label is: + ['Sybilla of Normandy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:31,907 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:31,908 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 112, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:31,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:31,908 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:31,908 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:32,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:32,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:32,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:32,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:32,947 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0382065773010254 s; generated tokens: 4 tokens; generate speed: 3.8527977836536187 tokens/s +2024-07-30 13:48:32,952 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:32,952 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[129/2067], cost time 1.0493s, every example cost time is 1.0493, generate speed: 3.8121 tokens/s, avg speed: 9.9914 tokens/s, remaining time: 0:43:25 +pred is: + ['Hereford'] + label is: + ['Hereford'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:33,059 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:33,059 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:33,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:33,060 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:33,060 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:34,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:34,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:34,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:34,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:34,100 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0400478839874268 s; generated tokens: 4 tokens; generate speed: 3.8459767685545874 tokens/s +2024-07-30 13:48:34,105 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:34,105 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[130/2067], cost time 1.0516s, every example cost time is 1.0516, generate speed: 3.8037 tokens/s, avg speed: 9.9541 tokens/s, remaining time: 0:43:20 +pred is: + ['Wales'] + label is: + ['Wales'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 74.9959706959707, Em score: 64.61538461538461, current_count: 130 +2024-07-30 13:48:34,214 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:34,214 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:34,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:34,215 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:34,215 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:35,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:35,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:35,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:35,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:35,254 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0388786792755127 s; generated tokens: 4 tokens; generate speed: 3.850305218304699 tokens/s +2024-07-30 13:48:35,259 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:35,259 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[131/2067], cost time 1.0500s, every example cost time is 1.0500, generate speed: 3.8096 tokens/s, avg speed: 9.9174 tokens/s, remaining time: 0:43:14 +pred is: + ['1018'] + label is: + ['1018'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:35,341 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:35,341 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:35,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:35,342 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:35,342 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:36,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:36,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:36,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:36,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:36,382 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0401084423065186 s; generated tokens: 4 tokens; generate speed: 3.845752843933946 tokens/s +2024-07-30 13:48:36,387 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:36,387 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[132/2067], cost time 1.0512s, every example cost time is 1.0512, generate speed: 3.8051 tokens/s, avg speed: 9.8810 tokens/s, remaining time: 0:43:08 +pred is: + ['1097'] + label is: + ['1097'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:36,469 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:36,469 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 105, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:36,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:36,470 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:36,470 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:37,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:37,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:37,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:37,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:37,509 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0385081768035889 s; generated tokens: 4 tokens; generate speed: 3.851678869117381 tokens/s +2024-07-30 13:48:37,513 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:37,513 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[133/2067], cost time 1.0497s, every example cost time is 1.0497, generate speed: 3.8106 tokens/s, avg speed: 9.8451 tokens/s, remaining time: 0:43:03 +pred is: + ['380 years'] + label is: + ['380 years'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:37,606 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:37,606 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:37,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:37,607 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:37,607 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:38,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,770 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1626126766204834 s; generated tokens: 8 tokens; generate speed: 6.881053476257144 tokens/s +2024-07-30 13:48:38,774 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:38,775 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[134/2067], cost time 1.1740s, every example cost time is 1.1740, generate speed: 6.8142 tokens/s, avg speed: 9.8252 tokens/s, remaining time: 0:42:59 +pred is: + ['A storm dispersed the fleet.'] + label is: + ['a storm'] +The F1/Em of this example is: {'F1': 46.15384615384615, 'Em': 0.0} +2024-07-30 13:48:38,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:38,863 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 256, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:38,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:38,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:38,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:39,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:39,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:40,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:40,033 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.16886305809021 s; generated tokens: 8 tokens; generate speed: 6.844257712337231 tokens/s +2024-07-30 13:48:40,038 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:40,038 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[135/2067], cost time 1.1803s, every example cost time is 1.1803, generate speed: 6.7777 tokens/s, avg speed: 9.8052 tokens/s, remaining time: 0:42:56 +pred is: + ['Conrad of Montferrat'] + label is: + ['Conrad of Montferrat'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:40,121 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:40,121 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:40,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:40,122 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:40,122 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:41,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,254 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.131641149520874 s; generated tokens: 7 tokens; generate speed: 6.185706487399943 tokens/s +2024-07-30 13:48:41,259 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:41,259 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[136/2067], cost time 1.1428s, every example cost time is 1.1428, generate speed: 6.1256 tokens/s, avg speed: 9.7820 tokens/s, remaining time: 0:42:52 +pred is: + ['Richard the Lion-Heart'] + label is: + ['Richard the Lion-Heart'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:41,350 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:41,351 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:41,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:41,352 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:41,352 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:42,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:42,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:42,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:42,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:42,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0398552417755127 s; generated tokens: 4 tokens; generate speed: 3.846689269143034 tokens/s +2024-07-30 13:48:42,396 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:42,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[137/2067], cost time 1.0513s, every example cost time is 1.0513, generate speed: 3.8048 tokens/s, avg speed: 9.7475 tokens/s, remaining time: 0:42:46 +pred is: + ['1489'] + label is: + ['1489'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:42,479 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:42,479 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:42,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:42,480 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:42,480 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:43,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:43,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:43,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:43,494 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0137052536010742 s; generated tokens: 3 tokens; generate speed: 2.959440122602538 tokens/s +2024-07-30 13:48:43,498 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:43,499 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[138/2067], cost time 1.0249s, every example cost time is 1.0249, generate speed: 2.9273 tokens/s, avg speed: 9.7094 tokens/s, remaining time: 0:42:41 +pred is: + ['Africa'] + label is: + ['Africa'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:43,587 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:43,587 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 108, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:43,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:43,588 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:43,588 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:44,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2288603782653809 s; generated tokens: 10 tokens; generate speed: 8.137620983529205 tokens/s +2024-07-30 13:48:44,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:44,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[139/2067], cost time 1.2403s, every example cost time is 1.2403, generate speed: 8.0624 tokens/s, avg speed: 9.6983 tokens/s, remaining time: 0:42:38 +pred is: + ['Enrique Pérez de Guzmán'] + label is: + ['Bethencourt'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:48:44,905 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:44,905 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:44,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:44,906 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:44,906 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:45,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:45,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:45,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:45,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:45,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,441 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5350518226623535 s; generated tokens: 20 tokens; generate speed: 13.0288760970379 tokens/s +2024-07-30 13:48:46,446 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:46,447 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[140/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9346 tokens/s, avg speed: 9.7252 tokens/s, remaining time: 0:42:40 +pred is: + ['Channel Islands'] + label is: + ['Channel Islands'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 75.68307169021455, Em score: 65.71428571428571, current_count: 140 +2024-07-30 13:48:46,557 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:46,557 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 122, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:46,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:46,558 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:46,558 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:47,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:47,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:48,102 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5432846546173096 s; generated tokens: 20 tokens; generate speed: 12.959372038180103 tokens/s +2024-07-30 13:48:48,107 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:48,107 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[141/2067], cost time 1.5546s, every example cost time is 1.5546, generate speed: 12.8653 tokens/s, avg speed: 9.7512 tokens/s, remaining time: 0:42:42 +pred is: + ['Rounded arches, particularly over windows and doorways, and massive proportions'] + label is: + ['Romanesque'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:48:48,190 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:48,190 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 111, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:48,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:48,191 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:48,191 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:49,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,732 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541351079940796 s; generated tokens: 20 tokens; generate speed: 12.975629147882525 tokens/s +2024-07-30 13:48:49,737 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:49,738 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[142/2067], cost time 1.5529s, every example cost time is 1.5529, generate speed: 12.8789 tokens/s, avg speed: 9.7769 tokens/s, remaining time: 0:42:43 +pred is: + ['Early Gothic'] + label is: + ['Early Gothic'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:49,822 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:49,822 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:49,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:49,823 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:49,823 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:50,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:50,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:51,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:51,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:51,360 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536651372909546 s; generated tokens: 20 tokens; generate speed: 13.015313917386054 tokens/s +2024-07-30 13:48:51,365 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:51,365 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[143/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9160 tokens/s, avg speed: 9.8024 tokens/s, remaining time: 0:42:45 +pred is: + ['In the early 11th century'] + label is: + ['early 11th century'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 13:48:51,448 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:51,448 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:51,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:51,449 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:51,449 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:52,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:52,990 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5407516956329346 s; generated tokens: 20 tokens; generate speed: 12.980676936256158 tokens/s +2024-07-30 13:48:52,994 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:52,995 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[144/2067], cost time 1.5521s, every example cost time is 1.5521, generate speed: 12.8857 tokens/s, avg speed: 9.8273 tokens/s, remaining time: 0:42:46 +pred is: + ['1562-1598'] + label is: + ['16th century'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:48:53,079 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:53,079 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 126, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:53,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:53,080 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:53,080 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:54,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,611 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5305159091949463 s; generated tokens: 20 tokens; generate speed: 13.067489125624332 tokens/s +2024-07-30 13:48:54,616 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:54,616 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[145/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9663 tokens/s, avg speed: 9.8523 tokens/s, remaining time: 0:42:48 +pred is: + ['Embroidery'] + label is: + ['embroidery'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:54,702 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:54,702 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:54,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:54,703 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:54,703 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:55,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,805 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.101799488067627 s; generated tokens: 5 tokens; generate speed: 4.538030788859023 tokens/s +2024-07-30 13:48:55,810 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:55,810 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[146/2067], cost time 1.1133s, every example cost time is 1.1133, generate speed: 4.4910 tokens/s, avg speed: 9.8217 tokens/s, remaining time: 0:42:44 +pred is: + ['Mosaics'] + label is: + ['mosaics'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:55,892 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:55,893 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:55,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:55,893 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:55,893 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:56,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:56,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:56,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:56,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:56,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:56,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,151 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.257641315460205 s; generated tokens: 11 tokens; generate speed: 8.74653199189373 tokens/s +2024-07-30 13:48:57,156 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:57,156 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[147/2067], cost time 1.2688s, every example cost time is 1.2688, generate speed: 8.6693 tokens/s, avg speed: 9.8142 tokens/s, remaining time: 0:42:41 +pred is: + ['11th'] + label is: + ['11th'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:57,238 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:57,238 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 118, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:57,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:57,239 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:57,239 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:58,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,620 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3805015087127686 s; generated tokens: 15 tokens; generate speed: 10.865616520757419 tokens/s +2024-07-30 13:48:58,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:58,625 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[148/2067], cost time 1.3918s, every example cost time is 1.3918, generate speed: 10.7770 tokens/s, avg speed: 9.8210 tokens/s, remaining time: 0:42:41 +pred is: + ['Southern Italy'] + label is: + ['southern Italy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:58,732 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:58,732 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 115, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:58,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:58,733 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:58,733 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:48:59,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:59,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:59,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:59,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:59,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0396971702575684 s; generated tokens: 4 tokens; generate speed: 3.847274104832914 tokens/s +2024-07-30 13:48:59,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:48:59,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[149/2067], cost time 1.0512s, every example cost time is 1.0512, generate speed: 3.8050 tokens/s, avg speed: 9.7891 tokens/s, remaining time: 0:42:36 +pred is: + ['1856'] + label is: + ['1856'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:48:59,861 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:48:59,861 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:48:59,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:48:59,862 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:48:59,862 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:00,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:00,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:01,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:01,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:01,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:01,417 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5547473430633545 s; generated tokens: 20 tokens; generate speed: 12.863826453366718 tokens/s +2024-07-30 13:49:01,421 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:01,422 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[150/2067], cost time 1.5660s, every example cost time is 1.5660, generate speed: 12.7710 tokens/s, avg speed: 9.8125 tokens/s, remaining time: 0:42:37 +pred is: + ['1884'] + label is: + ['1884'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 75.78039072039071, Em score: 66.0, current_count: 150 +2024-07-30 13:49:01,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:01,561 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:01,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:01,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:01,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:02,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,756 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1941766738891602 s; generated tokens: 9 tokens; generate speed: 7.5365732699241725 tokens/s +2024-07-30 13:49:02,760 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:02,761 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[151/2067], cost time 1.2057s, every example cost time is 1.2057, generate speed: 7.4648 tokens/s, avg speed: 9.7984 tokens/s, remaining time: 0:42:34 +pred is: + ['1893'] + label is: + ['1893'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:02,843 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:02,843 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:02,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:02,844 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:02,844 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:03,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:03,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:03,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:03,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:03,885 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0412535667419434 s; generated tokens: 4 tokens; generate speed: 3.841523455728369 tokens/s +2024-07-30 13:49:03,890 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:03,890 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[152/2067], cost time 1.0524s, every example cost time is 1.0524, generate speed: 3.8009 tokens/s, avg speed: 9.7672 tokens/s, remaining time: 0:42:30 +pred is: + ['1943'] + label is: + ['1943'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:03,973 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:03,973 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:03,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:03,974 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:03,974 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:04,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:04,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:04,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,506 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5321500301361084 s; generated tokens: 20 tokens; generate speed: 13.053551941139407 tokens/s +2024-07-30 13:49:05,511 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:05,511 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[153/2067], cost time 1.5434s, every example cost time is 1.5434, generate speed: 12.9585 tokens/s, avg speed: 9.7914 tokens/s, remaining time: 0:42:31 +pred is: + ['Croatia'] + label is: + ['Croatia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:05,594 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:05,594 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:05,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:05,595 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:05,595 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:06,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:06,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:06,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:06,604 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0082955360412598 s; generated tokens: 3 tokens; generate speed: 2.9753181411260745 tokens/s +2024-07-30 13:49:06,608 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:06,609 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[154/2067], cost time 1.0193s, every example cost time is 1.0193, generate speed: 2.9432 tokens/s, avg speed: 9.7573 tokens/s, remaining time: 0:42:26 +pred is: + ['5'] + label is: + ['four'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:06,690 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:06,690 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:06,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:06,691 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:06,691 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:07,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:07,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:08,246 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5544614791870117 s; generated tokens: 20 tokens; generate speed: 12.86619209789622 tokens/s +2024-07-30 13:49:08,250 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:08,251 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[155/2067], cost time 1.5655s, every example cost time is 1.5655, generate speed: 12.7751 tokens/s, avg speed: 9.7802 tokens/s, remaining time: 0:42:27 +pred is: + ['Martin Sekulić'] + label is: + ['Martin Sekulić'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:08,333 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:08,333 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:08,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:08,334 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:08,334 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:09,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,404 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0692548751831055 s; generated tokens: 5 tokens; generate speed: 4.676153568290975 tokens/s +2024-07-30 13:49:09,408 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:09,409 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[156/2067], cost time 1.0803s, every example cost time is 1.0803, generate speed: 4.6282 tokens/s, avg speed: 9.7534 tokens/s, remaining time: 0:42:23 +pred is: + ['Cholera'] + label is: + ['cholera'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:09,491 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:09,491 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:09,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:09,492 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:09,492 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:10,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:10,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:11,046 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.554100751876831 s; generated tokens: 20 tokens; generate speed: 12.869178511011416 tokens/s +2024-07-30 13:49:11,051 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:11,051 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[157/2067], cost time 1.5654s, every example cost time is 1.5654, generate speed: 12.7766 tokens/s, avg speed: 9.7760 tokens/s, remaining time: 0:42:24 +pred is: + ['Tomingaj'] + label is: + ['Tomingaj'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:11,134 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:11,134 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 368, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:11,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:11,135 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:11,135 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:12,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,384 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.248671293258667 s; generated tokens: 10 tokens; generate speed: 8.008512771926489 tokens/s +2024-07-30 13:49:12,389 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:12,389 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[158/2067], cost time 1.2599s, every example cost time is 1.2599, generate speed: 7.9372 tokens/s, avg speed: 9.7650 tokens/s, remaining time: 0:42:22 +pred is: + ['1875'] + label is: + ['1875'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:12,471 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:12,471 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:12,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:12,472 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:12,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:13,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:13,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:14,007 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5344147682189941 s; generated tokens: 20 tokens; generate speed: 13.034285392869451 tokens/s +2024-07-30 13:49:14,011 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:14,012 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[159/2067], cost time 1.5457s, every example cost time is 1.5457, generate speed: 12.9394 tokens/s, avg speed: 9.7882 tokens/s, remaining time: 0:42:23 +pred is: + ['He dropped out of school'] + label is: + ['left Graz'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 13:49:14,095 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:14,095 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 134, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:14,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:14,096 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:14,096 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:15,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,632 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5361254215240479 s; generated tokens: 20 tokens; generate speed: 13.01977020870942 tokens/s +2024-07-30 13:49:15,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:15,637 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[160/2067], cost time 1.5474s, every example cost time is 1.5474, generate speed: 12.9247 tokens/s, avg speed: 9.8109 tokens/s, remaining time: 0:42:25 +pred is: + ['For not having a residence permit'] + label is: + ['not having a residence permit'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +F1 score: 76.08578296703297, Em score: 66.25, current_count: 160 +2024-07-30 13:49:15,752 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:15,752 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:15,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:15,753 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:15,753 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:16,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:16,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:16,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:16,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:16,792 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0388391017913818 s; generated tokens: 4 tokens; generate speed: 3.8504519064620983 tokens/s +2024-07-30 13:49:16,797 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:16,797 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[161/2067], cost time 1.0500s, every example cost time is 1.0500, generate speed: 3.8097 tokens/s, avg speed: 9.7815 tokens/s, remaining time: 0:42:20 +pred is: + ['Prague'] + label is: + ['Prague'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:16,883 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:16,883 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:16,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:16,884 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:16,884 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:17,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:17,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:17,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:17,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:17,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:17,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3790435791015625 s; generated tokens: 15 tokens; generate speed: 10.877103687885192 tokens/s +2024-07-30 13:49:18,268 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:18,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[162/2067], cost time 1.3905s, every example cost time is 1.3905, generate speed: 10.7876 tokens/s, avg speed: 9.7880 tokens/s, remaining time: 0:42:19 +pred is: + ['Budapest'] + label is: + ['Budapest'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:18,351 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:18,351 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:18,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:18,352 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:18,352 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:19,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,781 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4287188053131104 s; generated tokens: 16 tokens; generate speed: 11.198844685531752 tokens/s +2024-07-30 13:49:19,786 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:19,786 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[163/2067], cost time 1.4400s, every example cost time is 1.4400, generate speed: 11.1107 tokens/s, avg speed: 9.7968 tokens/s, remaining time: 0:42:19 +pred is: + ['1882'] + label is: + ['1882'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:19,875 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:19,875 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:19,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:19,876 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:19,876 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:20,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:20,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:20,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:20,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:20,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:20,955 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.078833818435669 s; generated tokens: 5 tokens; generate speed: 4.634634097075398 tokens/s +2024-07-30 13:49:20,960 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:20,960 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[164/2067], cost time 1.0903s, every example cost time is 1.0903, generate speed: 4.5860 tokens/s, avg speed: 9.7708 tokens/s, remaining time: 0:42:15 +pred is: + ['50,000'] + label is: + ['fifty thousand dollars'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:21,042 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:21,042 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 124, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:21,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:21,043 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:21,043 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:21,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,577 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342533588409424 s; generated tokens: 20 tokens; generate speed: 13.035656650026223 tokens/s +2024-07-30 13:49:22,582 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:22,582 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[165/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9413 tokens/s, avg speed: 9.7930 tokens/s, remaining time: 0:42:16 +pred is: + ['Robert Lane and Benjamin Vail'] + label is: + ['Robert Lane and Benjamin Vail'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:22,665 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:22,665 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:22,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:22,666 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:22,666 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:23,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:23,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:24,208 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5414845943450928 s; generated tokens: 20 tokens; generate speed: 12.974505274570777 tokens/s +2024-07-30 13:49:24,213 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:24,213 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[166/2067], cost time 1.5527s, every example cost time is 1.5527, generate speed: 12.8808 tokens/s, avg speed: 9.8147 tokens/s, remaining time: 0:42:17 +pred is: + ['They forced him out of the company'] + label is: + ['forced Tesla out'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 13:49:24,295 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:24,296 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:24,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:24,296 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:24,297 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:25,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,836 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5394608974456787 s; generated tokens: 20 tokens; generate speed: 12.991560898483762 tokens/s +2024-07-30 13:49:25,842 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:25,842 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[167/2067], cost time 1.5515s, every example cost time is 1.5515, generate speed: 12.8909 tokens/s, avg speed: 9.8360 tokens/s, remaining time: 0:42:18 +pred is: + ['A Western Union superintendent'] + label is: + ['a Western Union superintendent'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:25,926 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:25,926 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:25,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:25,927 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:25,927 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:26,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:26,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:26,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:26,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:26,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,459 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5317778587341309 s; generated tokens: 20 tokens; generate speed: 13.056723522905667 tokens/s +2024-07-30 13:49:27,464 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:27,465 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[168/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9566 tokens/s, avg speed: 9.8575 tokens/s, remaining time: 0:42:19 +pred is: + ['1'] + label is: + ['an induction motor'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:27,547 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:27,548 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:27,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:27,548 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:27,549 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:28,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:28,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:29,079 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530040979385376 s; generated tokens: 20 tokens; generate speed: 13.071545317716971 tokens/s +2024-07-30 13:49:29,084 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:29,084 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[169/2067], cost time 1.5416s, every example cost time is 1.5416, generate speed: 12.9738 tokens/s, avg speed: 9.8787 tokens/s, remaining time: 0:42:20 +pred is: + ['1'] + label is: + ['editor of Electrical World magazine'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:29,168 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:29,169 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:29,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:29,169 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:29,169 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:30,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,365 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.19498610496521 s; generated tokens: 9 tokens; generate speed: 7.531468326371895 tokens/s +2024-07-30 13:49:30,369 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:30,370 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[170/2067], cost time 1.2064s, every example cost time is 1.2064, generate speed: 7.4600 tokens/s, avg speed: 9.8659 tokens/s, remaining time: 0:42:18 +pred is: + ['1888'] + label is: + ['1888'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 75.2702793938088, Em score: 65.88235294117646, current_count: 170 +2024-07-30 13:49:30,488 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:30,488 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:30,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:30,489 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:30,489 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:31,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:31,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:32,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5398106575012207 s; generated tokens: 20 tokens; generate speed: 12.988609932376797 tokens/s +2024-07-30 13:49:32,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:32,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[171/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8915 tokens/s, avg speed: 9.8864 tokens/s, remaining time: 0:42:19 +pred is: + ['Pittsburgh'] + label is: + ['Pittsburgh'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:32,141 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:32,142 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 299, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:32,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:32,143 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:32,143 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:33,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,700 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5568890571594238 s; generated tokens: 20 tokens; generate speed: 12.846130498527886 tokens/s +2024-07-30 13:49:33,705 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:33,705 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[172/2067], cost time 1.5685s, every example cost time is 1.5685, generate speed: 12.7511 tokens/s, avg speed: 9.9059 tokens/s, remaining time: 0:42:20 +pred is: + ['Thomas Edison and George Westinghouse'] + label is: + ['Thomas Edison and George Westinghouse'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:33,788 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:33,788 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:33,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:33,788 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:33,789 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:34,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:34,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:35,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:35,323 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5341315269470215 s; generated tokens: 20 tokens; generate speed: 13.036691866831484 tokens/s +2024-07-30 13:49:35,328 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:35,328 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[173/2067], cost time 1.5453s, every example cost time is 1.5453, generate speed: 12.9422 tokens/s, avg speed: 9.9261 tokens/s, remaining time: 0:42:21 +pred is: + ['1'] + label is: + ['George Westinghouse'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:35,434 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:35,434 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:35,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:35,435 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:35,435 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:36,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:36,993 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5583012104034424 s; generated tokens: 20 tokens; generate speed: 12.834489164531947 tokens/s +2024-07-30 13:49:36,998 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:36,999 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[174/2067], cost time 1.5700s, every example cost time is 1.5700, generate speed: 12.7391 tokens/s, avg speed: 9.9450 tokens/s, remaining time: 0:42:22 +pred is: + ['1'] + label is: + ['Richard Dean Adams'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:37,081 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:37,081 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 305, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:37,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:37,082 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:37,082 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:38,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,278 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1961021423339844 s; generated tokens: 9 tokens; generate speed: 7.524441000028704 tokens/s +2024-07-30 13:49:38,283 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:38,313 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[175/2067], cost time 1.2373s, every example cost time is 1.2373, generate speed: 7.2738 tokens/s, avg speed: 9.9309 tokens/s, remaining time: 0:42:19 +pred is: + ['1896'] + label is: + ['1896'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:38,396 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:38,396 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 128, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:38,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:38,397 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:38,397 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:39,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:39,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:39,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:39,404 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0071592330932617 s; generated tokens: 3 tokens; generate speed: 2.9786749715694696 tokens/s +2024-07-30 13:49:39,409 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:39,410 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[176/2067], cost time 1.0189s, every example cost time is 1.0189, generate speed: 2.9445 tokens/s, avg speed: 9.9007 tokens/s, remaining time: 0:42:15 +pred is: + ['35'] + label is: + ['35'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:39,492 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:39,492 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 91, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:39,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:39,493 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:39,493 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:40,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:40,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:41,019 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5260653495788574 s; generated tokens: 20 tokens; generate speed: 13.105598659663773 tokens/s +2024-07-30 13:49:41,024 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:41,024 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[177/2067], cost time 1.5374s, every example cost time is 1.5374, generate speed: 13.0093 tokens/s, avg speed: 9.9209 tokens/s, remaining time: 0:42:15 +pred is: + ['American Institute of Electrical Engineers'] + label is: + ['American Institute of Electrical Engineers'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:41,108 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:41,108 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:41,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:41,109 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:41,109 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:42,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,689 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5804193019866943 s; generated tokens: 20 tokens; generate speed: 12.65486948612855 tokens/s +2024-07-30 13:49:42,694 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:42,695 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[178/2067], cost time 1.5916s, every example cost time is 1.5916, generate speed: 12.5660 tokens/s, avg speed: 9.9385 tokens/s, remaining time: 0:42:17 +pred is: + ['He noticed damaged film in his laboratory in previous experiments.'] + label is: + ['he had noticed damaged film in his laboratory in previous experiments'] +The F1/Em of this example is: {'F1': 87.80487804878048, 'Em': 0.0} +2024-07-30 13:49:42,778 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:42,778 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:42,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:42,779 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:42,779 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:43,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,848 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0690059661865234 s; generated tokens: 5 tokens; generate speed: 4.677242371094105 tokens/s +2024-07-30 13:49:43,853 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:43,853 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[179/2067], cost time 1.0800s, every example cost time is 1.0800, generate speed: 4.6298 tokens/s, avg speed: 9.9146 tokens/s, remaining time: 0:42:12 +pred is: + ['X-ray imaging'] + label is: + ['X-ray imaging'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:43,935 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:43,935 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:43,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:43,936 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:43,936 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:44,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:44,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:44,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:44,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,465 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528944969177246 s; generated tokens: 20 tokens; generate speed: 13.080915535346163 tokens/s +2024-07-30 13:49:45,470 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:45,470 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[180/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9865 tokens/s, avg speed: 9.9342 tokens/s, remaining time: 0:42:13 +pred is: + ['1'] + label is: + ['X-rays were longitudinal waves'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 74.90973541664599, Em score: 65.55555555555556, current_count: 180 +2024-07-30 13:49:45,622 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:45,622 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 112, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:45,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:45,623 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:45,623 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:46,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:46,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:47,153 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529965877532959 s; generated tokens: 20 tokens; generate speed: 13.072186964228 tokens/s +2024-07-30 13:49:47,159 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:47,159 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[181/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9682 tokens/s, avg speed: 9.9534 tokens/s, remaining time: 0:42:14 +pred is: + ['Benjamin Lamme'] + label is: + ['Benjamin Lamme'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:47,241 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:47,241 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 82, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:47,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:47,242 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:47,242 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:48,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,794 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5512869358062744 s; generated tokens: 20 tokens; generate speed: 12.892521388768797 tokens/s +2024-07-30 13:49:48,798 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:48,799 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[182/2067], cost time 1.5624s, every example cost time is 1.5624, generate speed: 12.8006 tokens/s, avg speed: 9.9716 tokens/s, remaining time: 0:42:15 +pred is: + ['Egg of Columbus'] + label is: + ['Egg of Columbus'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:48,882 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:48,882 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:48,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:48,883 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:48,883 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:49,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:49,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:49,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:49,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:49,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:49,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,413 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530275583267212 s; generated tokens: 20 tokens; generate speed: 13.069541341892837 tokens/s +2024-07-30 13:49:50,418 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:50,418 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[183/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9742 tokens/s, avg speed: 9.9904 tokens/s, remaining time: 0:42:16 +pred is: + ['11 July 1934'] + label is: + ['1934'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:49:50,501 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:50,501 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:50,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:50,502 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:50,502 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:51,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,663 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1608266830444336 s; generated tokens: 8 tokens; generate speed: 6.891640342913947 tokens/s +2024-07-30 13:49:51,668 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:51,668 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[184/2067], cost time 1.1720s, every example cost time is 1.1720, generate speed: 6.8261 tokens/s, avg speed: 9.9754 tokens/s, remaining time: 0:42:12 +pred is: + ['Franklin Institute'] + label is: + ['National Electric Light Association'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 13:49:51,750 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:51,750 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:51,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:51,751 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:51,751 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:52,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:52,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:53,030 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2793738842010498 s; generated tokens: 11 tokens; generate speed: 8.597955715556393 tokens/s +2024-07-30 13:49:53,035 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:53,035 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[185/2067], cost time 1.2905s, every example cost time is 1.2905, generate speed: 8.5235 tokens/s, avg speed: 9.9679 tokens/s, remaining time: 0:42:11 +pred is: + ['1898'] + label is: + ['1898'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:53,117 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:53,117 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 260, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:53,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:53,118 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:53,118 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:54,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,658 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5400028228759766 s; generated tokens: 20 tokens; generate speed: 12.986989181389761 tokens/s +2024-07-30 13:49:54,663 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:54,663 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[186/2067], cost time 1.5513s, every example cost time is 1.5513, generate speed: 12.8921 tokens/s, avg speed: 9.9860 tokens/s, remaining time: 0:42:11 +pred is: + ['1900'] + label is: + ['1900'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:54,745 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:54,746 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:54,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:54,746 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:54,747 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:55,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:55,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:56,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2553048133850098 s; generated tokens: 11 tokens; generate speed: 8.762811934368193 tokens/s +2024-07-30 13:49:56,007 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:56,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[187/2067], cost time 1.2665s, every example cost time is 1.2665, generate speed: 8.6854 tokens/s, avg speed: 9.9794 tokens/s, remaining time: 0:42:09 +pred is: + ['1899'] + label is: + ['1899'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:56,089 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:56,089 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 95, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:56,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:56,090 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:56,090 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:57,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,622 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5319809913635254 s; generated tokens: 20 tokens; generate speed: 13.054992269975351 tokens/s +2024-07-30 13:49:57,627 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:57,627 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[188/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9594 tokens/s, avg speed: 9.9976 tokens/s, remaining time: 0:42:10 +pred is: + ['1'] + label is: + ['atmospheric'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:49:57,710 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:57,710 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:57,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:57,711 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:57,711 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:49:58,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:58,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:59,251 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402216911315918 s; generated tokens: 20 tokens; generate speed: 12.9851437070115 tokens/s +2024-07-30 13:49:59,256 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:49:59,256 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[189/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8913 tokens/s, avg speed: 10.0152 tokens/s, remaining time: 0:42:10 +pred is: + ['Lightning'] + label is: + ['lightning'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:49:59,338 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:49:59,338 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:49:59,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:49:59,339 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:49:59,339 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:00,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,746 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.406700849533081 s; generated tokens: 16 tokens; generate speed: 11.374131184544886 tokens/s +2024-07-30 13:50:00,751 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:00,751 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[190/2067], cost time 1.4180s, every example cost time is 1.4180, generate speed: 11.2835 tokens/s, avg speed: 10.0223 tokens/s, remaining time: 0:42:10 +pred is: + ['A power outage'] + label is: + ['power outage'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 74.80045109647163, Em score: 65.26315789473684, current_count: 190 +2024-07-30 13:50:00,884 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:00,884 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 285, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:00,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:00,885 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:00,885 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:01,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:01,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:01,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:01,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:01,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:01,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,426 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5403246879577637 s; generated tokens: 20 tokens; generate speed: 12.984275429952993 tokens/s +2024-07-30 13:50:02,431 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:02,431 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[191/2067], cost time 1.5520s, every example cost time is 1.5520, generate speed: 12.8868 tokens/s, avg speed: 10.0395 tokens/s, remaining time: 0:42:10 +pred is: + ['Mars'] + label is: + ['communications from another planet'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:02,514 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:02,514 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 91, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:02,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:02,515 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:02,515 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:03,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:03,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:03,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:03,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:03,552 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0371732711791992 s; generated tokens: 4 tokens; generate speed: 3.8566362160994156 tokens/s +2024-07-30 13:50:03,557 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:03,557 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[192/2067], cost time 1.0483s, every example cost time is 1.0483, generate speed: 3.8158 tokens/s, avg speed: 10.0143 tokens/s, remaining time: 0:42:06 +pred is: + ['100000'] + label is: + ['$100,000'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:03,639 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:03,640 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 85, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:03,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:03,640 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:03,640 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:04,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:04,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:05,045 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.404123306274414 s; generated tokens: 16 tokens; generate speed: 11.395010629410526 tokens/s +2024-07-30 13:50:05,049 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:05,050 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[193/2067], cost time 1.4152s, every example cost time is 1.4152, generate speed: 11.3059 tokens/s, avg speed: 10.0213 tokens/s, remaining time: 0:42:05 +pred is: + ['1900'] + label is: + ['1900'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:05,140 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:05,140 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 77, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:05,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:05,141 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:05,141 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:06,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5258827209472656 s; generated tokens: 20 tokens; generate speed: 13.10716723208192 tokens/s +2024-07-30 13:50:06,672 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:06,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[194/2067], cost time 1.5375s, every example cost time is 1.5375, generate speed: 13.0084 tokens/s, avg speed: 10.0389 tokens/s, remaining time: 0:42:06 +pred is: + ['A trans-Atlantic wireless telecommunications facility known as Wardenclyffe'] + label is: + ['Wardenclyffe'] +The F1/Em of this example is: {'F1': 12.5, 'Em': 0.0} +2024-07-30 13:50:06,755 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:06,755 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:06,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:06,756 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:06,756 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:07,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:07,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:08,168 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4122750759124756 s; generated tokens: 16 tokens; generate speed: 11.329237676776494 tokens/s +2024-07-30 13:50:08,173 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:08,173 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[195/2067], cost time 1.4234s, every example cost time is 1.4234, generate speed: 11.2408 tokens/s, avg speed: 10.0454 tokens/s, remaining time: 0:42:05 +pred is: + ['Morgan'] + label is: + ['Morgan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:08,255 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:08,256 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:08,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:08,256 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:08,257 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:09,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,797 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5399158000946045 s; generated tokens: 20 tokens; generate speed: 12.9877230941921 tokens/s +2024-07-30 13:50:09,802 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:09,802 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[196/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8913 tokens/s, avg speed: 10.0620 tokens/s, remaining time: 0:42:06 +pred is: + ['50'] + label is: + ['over 50 letters'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:50:09,887 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:09,887 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 116, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:09,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:09,888 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:09,888 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:10,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:10,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:10,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:10,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:10,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:10,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,419 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5304152965545654 s; generated tokens: 20 tokens; generate speed: 13.06834820916005 tokens/s +2024-07-30 13:50:11,424 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:11,424 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[197/2067], cost time 1.5427s, every example cost time is 1.5427, generate speed: 12.9644 tokens/s, avg speed: 10.0789 tokens/s, remaining time: 0:42:06 +pred is: + ['200'] + label is: + ['200'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:11,506 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:11,507 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:11,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:11,507 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:11,508 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:12,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:12,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:13,011 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5035591125488281 s; generated tokens: 19 tokens; generate speed: 12.636683081778719 tokens/s +2024-07-30 13:50:13,016 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:13,017 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[198/2067], cost time 1.5150s, every example cost time is 1.5150, generate speed: 12.5412 tokens/s, avg speed: 10.0928 tokens/s, remaining time: 0:42:07 +pred is: + ['Steam'] + label is: + ['steam'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:13,099 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:13,100 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:13,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:13,100 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:13,100 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:14,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,630 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5295648574829102 s; generated tokens: 20 tokens; generate speed: 13.07561421940126 tokens/s +2024-07-30 13:50:14,635 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:14,635 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[199/2067], cost time 1.5408s, every example cost time is 1.5408, generate speed: 12.9801 tokens/s, avg speed: 10.1093 tokens/s, remaining time: 0:42:07 +pred is: + ['The application of electricity to the brain'] + label is: + ['application of electricity'] +The F1/Em of this example is: {'F1': 55.55555555555556, 'Em': 0.0} +2024-07-30 13:50:14,718 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:14,719 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:14,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:14,719 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:14,719 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:15,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:15,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:16,162 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4421699047088623 s; generated tokens: 17 tokens; generate speed: 11.787792786753425 tokens/s +2024-07-30 13:50:16,167 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:16,167 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[200/2067], cost time 1.4534s, every example cost time is 1.4534, generate speed: 11.6968 tokens/s, avg speed: 10.1178 tokens/s, remaining time: 0:42:07 +pred is: + ['Europe'] + label is: + ['overseas'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 73.5673729860925, Em score: 64.0, current_count: 200 +2024-07-30 13:50:16,292 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:16,292 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:16,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:16,293 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:16,293 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:17,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,838 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5444011688232422 s; generated tokens: 20 tokens; generate speed: 12.950003149271778 tokens/s +2024-07-30 13:50:17,867 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:17,868 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[201/2067], cost time 1.5805s, every example cost time is 1.5805, generate speed: 12.6545 tokens/s, avg speed: 10.1326 tokens/s, remaining time: 0:42:07 +pred is: + ['Electrical Experimenter'] + label is: + ['Electrical Experimenter'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:17,951 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:17,951 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:17,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:17,952 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:17,952 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:18,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:18,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:18,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:18,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,319 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3660924434661865 s; generated tokens: 14 tokens; generate speed: 10.24820836024669 tokens/s +2024-07-30 13:50:19,323 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:19,324 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[202/2067], cost time 1.3775s, every example cost time is 1.3775, generate speed: 10.1634 tokens/s, avg speed: 10.1327 tokens/s, remaining time: 0:42:06 +pred is: + ['Thomas Edison and Nikola Tesla'] + label is: + ['Thomas Edison and Nikola Tesla'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:19,406 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:19,406 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:19,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:19,407 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:19,407 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:20,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,849 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4411611557006836 s; generated tokens: 17 tokens; generate speed: 11.796043719853596 tokens/s +2024-07-30 13:50:20,853 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:20,854 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[203/2067], cost time 1.4524s, every example cost time is 1.4524, generate speed: 11.7050 tokens/s, avg speed: 10.1410 tokens/s, remaining time: 0:42:06 +pred is: + ['They were not given the award because of their animosity toward each other.'] + label is: + ['animosity toward each other'] +The F1/Em of this example is: {'F1': 42.42424242424242, 'Em': 0.0} +2024-07-30 13:50:20,938 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:20,938 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 96, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:20,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:20,939 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:20,939 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:21,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:21,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:21,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:21,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,490 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5510029792785645 s; generated tokens: 20 tokens; generate speed: 12.894881742459853 tokens/s +2024-07-30 13:50:22,495 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:22,495 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[204/2067], cost time 1.5625s, every example cost time is 1.5625, generate speed: 12.8000 tokens/s, avg speed: 10.1560 tokens/s, remaining time: 0:42:06 +pred is: + ['38'] + label is: + ['38'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:22,576 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:22,576 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:22,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:22,577 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:22,577 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:23,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:23,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:24,130 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5523993968963623 s; generated tokens: 20 tokens; generate speed: 12.883282510921507 tokens/s +2024-07-30 13:50:24,134 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:24,135 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[205/2067], cost time 1.5634s, every example cost time is 1.5634, generate speed: 12.7930 tokens/s, avg speed: 10.1709 tokens/s, remaining time: 0:42:07 +pred is: + ['1655114'] + label is: + ['U.S. Patent 1,655,114'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:24,217 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:24,217 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:24,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:24,217 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:24,218 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:25,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,774 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5566186904907227 s; generated tokens: 20 tokens; generate speed: 12.848361722866771 tokens/s +2024-07-30 13:50:25,779 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:25,780 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[206/2067], cost time 1.5678s, every example cost time is 1.5678, generate speed: 12.7570 tokens/s, avg speed: 10.1853 tokens/s, remaining time: 0:42:07 +pred is: + ['125'] + label is: + ['$125 per month'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 13:50:25,862 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:25,862 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 96, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:25,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:25,863 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:25,863 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:26,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:26,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:27,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:27,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:27,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:27,408 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5446593761444092 s; generated tokens: 20 tokens; generate speed: 12.947838409476118 tokens/s +2024-07-30 13:50:27,412 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:27,413 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[207/2067], cost time 1.5559s, every example cost time is 1.5559, generate speed: 12.8539 tokens/s, avg speed: 10.2001 tokens/s, remaining time: 0:42:08 +pred is: + ['1'] + label is: + ['mechanical energy'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:27,495 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:27,495 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:27,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:27,496 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:27,496 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:28,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:28,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:29,055 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5587983131408691 s; generated tokens: 20 tokens; generate speed: 12.830396229837717 tokens/s +2024-07-30 13:50:29,060 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:29,060 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[208/2067], cost time 1.5700s, every example cost time is 1.5700, generate speed: 12.7388 tokens/s, avg speed: 10.2142 tokens/s, remaining time: 0:42:08 +pred is: + ['Feed pigeons'] + label is: + ['feed the pigeons'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:50:29,143 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:29,144 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 107, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:29,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:29,144 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:29,144 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:30,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,214 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0689897537231445 s; generated tokens: 5 tokens; generate speed: 4.677313306872855 tokens/s +2024-07-30 13:50:30,218 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:30,219 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[209/2067], cost time 1.0801s, every example cost time is 1.0801, generate speed: 4.6294 tokens/s, avg speed: 10.1930 tokens/s, remaining time: 0:42:04 +pred is: + ['Teleforce weapon'] + label is: + ['"teleforce" weapon'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:50:30,301 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:30,301 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 133, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:30,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:30,302 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:30,302 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:31,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,848 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5456364154815674 s; generated tokens: 20 tokens; generate speed: 12.939653724300152 tokens/s +2024-07-30 13:50:31,853 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:31,853 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[210/2067], cost time 1.5569s, every example cost time is 1.5569, generate speed: 12.8462 tokens/s, avg speed: 10.2074 tokens/s, remaining time: 0:42:05 +pred is: + ['1937'] + label is: + ['1937'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 72.78319175340081, Em score: 62.857142857142854, current_count: 210 +2024-07-30 13:50:31,983 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:31,983 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:31,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:31,984 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:31,984 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:32,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:32,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:32,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,323 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3389909267425537 s; generated tokens: 13 tokens; generate speed: 9.708803652333856 tokens/s +2024-07-30 13:50:33,328 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:33,328 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[211/2067], cost time 1.3502s, every example cost time is 1.3502, generate speed: 9.6284 tokens/s, avg speed: 10.2047 tokens/s, remaining time: 0:42:03 +pred is: + ['Charged particle beam weapons'] + label is: + ['charged particle beam weapons'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:33,410 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:33,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:33,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:33,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:33,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:34,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,480 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0686790943145752 s; generated tokens: 5 tokens; generate speed: 4.678672977323355 tokens/s +2024-07-30 13:50:34,484 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:34,485 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[212/2067], cost time 1.0797s, every example cost time is 1.0797, generate speed: 4.6311 tokens/s, avg speed: 10.1838 tokens/s, remaining time: 0:42:00 +pred is: + ['Steal it'] + label is: + ['steal the invention'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:50:34,566 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:34,566 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:34,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:34,567 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:34,567 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:35,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:35,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:35,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:35,578 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.010920763015747 s; generated tokens: 3 tokens; generate speed: 2.9675916350263636 tokens/s +2024-07-30 13:50:35,583 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:35,583 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[213/2067], cost time 1.0219s, every example cost time is 1.0219, generate speed: 2.9357 tokens/s, avg speed: 10.1582 tokens/s, remaining time: 0:41:55 +pred is: + ['86'] + label is: + ['86'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:35,665 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:35,665 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:35,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:35,666 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:35,666 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:36,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:36,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:37,042 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3758397102355957 s; generated tokens: 14 tokens; generate speed: 10.175603957239082 tokens/s +2024-07-30 13:50:37,046 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:37,047 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[214/2067], cost time 1.3869s, every example cost time is 1.3869, generate speed: 10.0943 tokens/s, avg speed: 10.1579 tokens/s, remaining time: 0:41:54 +pred is: + ['They were seized by the FBI and stored in a warehouse.'] + label is: + ["FBI ordered the Alien Property Custodian to seize Tesla's belongings"] +The F1/Em of this example is: {'F1': 13.95348837209302, 'Em': 0.0} +2024-07-30 13:50:37,130 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:37,131 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:37,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:37,131 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:37,132 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:38,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,684 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.552093505859375 s; generated tokens: 20 tokens; generate speed: 12.885821585166834 tokens/s +2024-07-30 13:50:38,689 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:38,689 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[215/2067], cost time 1.5633s, every example cost time is 1.5633, generate speed: 12.7938 tokens/s, avg speed: 10.1720 tokens/s, remaining time: 0:41:55 +pred is: + ['Fiorello La Guardia'] + label is: + ['New York City mayor Fiorello La Guardia'] +The F1/Em of this example is: {'F1': 55.55555555555556, 'Em': 0.0} +2024-07-30 13:50:38,772 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:38,772 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:38,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:38,773 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:38,773 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:39,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:39,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:39,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:39,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:39,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0398645401000977 s; generated tokens: 4 tokens; generate speed: 3.846654872580768 tokens/s +2024-07-30 13:50:39,818 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:39,818 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[216/2067], cost time 1.0511s, every example cost time is 1.0511, generate speed: 3.8057 tokens/s, avg speed: 10.1491 tokens/s, remaining time: 0:41:51 +pred is: + ['Belgrade'] + label is: + ['Belgrade'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:39,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:39,900 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:39,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:39,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:39,901 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:40,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:40,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:40,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:40,909 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0078423023223877 s; generated tokens: 3 tokens; generate speed: 2.976656162464158 tokens/s +2024-07-30 13:50:40,913 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:40,914 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[217/2067], cost time 1.0189s, every example cost time is 1.0189, generate speed: 2.9443 tokens/s, avg speed: 10.1242 tokens/s, remaining time: 0:41:46 +pred is: + ['278'] + label is: + ['around 300'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:41,006 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:41,006 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:41,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:41,007 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:41,007 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:41,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:41,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,170 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1631569862365723 s; generated tokens: 8 tokens; generate speed: 6.877833426323844 tokens/s +2024-07-30 13:50:42,175 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:42,175 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[218/2067], cost time 1.1745s, every example cost time is 1.1745, generate speed: 6.8113 tokens/s, avg speed: 10.1110 tokens/s, remaining time: 0:41:43 +pred is: + ['8:10 p.m.'] + label is: + ['8:10 p.m'] +The F1/Em of this example is: {'F1': 90.9090909090909, 'Em': 0.0} +2024-07-30 13:50:42,256 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:42,257 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 84, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:42,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:42,257 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:42,258 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:43,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:43,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:43,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:43,265 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0073208808898926 s; generated tokens: 3 tokens; generate speed: 2.9781969746817167 tokens/s +2024-07-30 13:50:43,270 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:43,270 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[219/2067], cost time 1.0184s, every example cost time is 1.0184, generate speed: 2.9459 tokens/s, avg speed: 10.0864 tokens/s, remaining time: 0:41:39 +pred is: + ['8'] + label is: + ['between 8 to 10 miles per day'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 13:50:43,363 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:43,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 134, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:43,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:43,364 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:43,365 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:44,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:44,897 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5324347019195557 s; generated tokens: 20 tokens; generate speed: 13.051127056146429 tokens/s +2024-07-30 13:50:44,902 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:44,902 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[220/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9549 tokens/s, avg speed: 10.1012 tokens/s, remaining time: 0:41:40 +pred is: + ['Telepathy'] + label is: + ['telepathy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 72.31442780607554, Em score: 61.81818181818182, current_count: 220 +2024-07-30 13:50:45,033 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:45,034 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 127, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:45,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:45,034 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:45,035 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:45,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,563 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5277106761932373 s; generated tokens: 20 tokens; generate speed: 13.091484082467876 tokens/s +2024-07-30 13:50:46,567 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:46,567 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[221/2067], cost time 1.5388s, every example cost time is 1.5388, generate speed: 12.9969 tokens/s, avg speed: 10.1161 tokens/s, remaining time: 0:41:40 +pred is: + ['1'] + label is: + ['pigeons'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:46,650 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:46,650 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 111, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:46,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:46,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:46,651 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:47,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:47,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:47,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:47,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:47,690 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0386557579040527 s; generated tokens: 4 tokens; generate speed: 3.8511315896151856 tokens/s +2024-07-30 13:50:47,694 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:47,694 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[222/2067], cost time 1.0496s, every example cost time is 1.0496, generate speed: 3.8110 tokens/s, avg speed: 10.0941 tokens/s, remaining time: 0:41:36 +pred is: + ['142 pounds'] + label is: + ['142 pounds'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:47,776 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:47,776 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:47,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:47,777 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:47,777 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:48,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:48,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:49,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:49,004 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2267608642578125 s; generated tokens: 10 tokens; generate speed: 8.151547943331218 tokens/s +2024-07-30 13:50:49,009 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:49,009 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[223/2067], cost time 1.2378s, every example cost time is 1.2378, generate speed: 8.0787 tokens/s, avg speed: 10.0858 tokens/s, remaining time: 0:41:34 +pred is: + ['8'] + label is: + ['eight'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:50:49,091 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:49,091 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:49,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:49,092 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:49,092 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:50,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,627 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535187005996704 s; generated tokens: 20 tokens; generate speed: 13.027728818623768 tokens/s +2024-07-30 13:50:50,632 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:50,632 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[224/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9331 tokens/s, avg speed: 10.1003 tokens/s, remaining time: 0:41:34 +pred is: + ['48 hours'] + label is: + ['more than 48 hours'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 13:50:50,715 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:50,715 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:50,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:50,716 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:50,716 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:51,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:51,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:52,245 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5282008647918701 s; generated tokens: 20 tokens; generate speed: 13.087284833282602 tokens/s +2024-07-30 13:50:52,249 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:52,250 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[225/2067], cost time 1.5394s, every example cost time is 1.5394, generate speed: 12.9917 tokens/s, avg speed: 10.1150 tokens/s, remaining time: 0:41:34 +pred is: + ['Chastity'] + label is: + ['chastity'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:52,333 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:52,333 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:52,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:52,334 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:52,334 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:53,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,868 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5334203243255615 s; generated tokens: 20 tokens; generate speed: 13.042738303861027 tokens/s +2024-07-30 13:50:53,872 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:53,873 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[226/2067], cost time 1.5451s, every example cost time is 1.5451, generate speed: 12.9444 tokens/s, avg speed: 10.1292 tokens/s, remaining time: 0:41:34 +pred is: + ['Dorothy Skerrit'] + label is: + ['Dorothy Skerrit'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:53,955 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:53,955 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:53,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:53,956 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:53,956 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:54,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:54,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:54,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:54,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:55,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:55,033 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.076249122619629 s; generated tokens: 5 tokens; generate speed: 4.645764530641215 tokens/s +2024-07-30 13:50:55,037 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:55,038 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[227/2067], cost time 1.0874s, every example cost time is 1.0874, generate speed: 4.5981 tokens/s, avg speed: 10.1097 tokens/s, remaining time: 0:41:31 +pred is: + ['Mark Twain'] + label is: + ['Mark Twain'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:55,120 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:55,120 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 97, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:55,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:55,121 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:55,121 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:56,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,561 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4396295547485352 s; generated tokens: 17 tokens; generate speed: 11.808593359261401 tokens/s +2024-07-30 13:50:56,566 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:56,566 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[228/2067], cost time 1.4509s, every example cost time is 1.4509, generate speed: 11.7167 tokens/s, avg speed: 10.1172 tokens/s, remaining time: 0:41:30 +pred is: + ['Overweight people'] + label is: + ['overweight people'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:56,649 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:56,649 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:56,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:56,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:56,650 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:57,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:57,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:58,184 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5341808795928955 s; generated tokens: 20 tokens; generate speed: 13.036272493049923 tokens/s +2024-07-30 13:50:58,189 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:58,189 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[229/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9419 tokens/s, avg speed: 10.1313 tokens/s, remaining time: 0:41:30 +pred is: + ['electron'] + label is: + ['electron'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:50:58,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:58,272 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 76, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:58,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:58,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:58,273 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:50:59,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402607917785645 s; generated tokens: 20 tokens; generate speed: 12.984814069639253 tokens/s +2024-07-30 13:50:59,818 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:50:59,818 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[230/2067], cost time 1.5515s, every example cost time is 1.5515, generate speed: 12.8909 tokens/s, avg speed: 10.1450 tokens/s, remaining time: 0:41:30 +pred is: + ['1'] + label is: + ["Einstein's"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 72.03988746668097, Em score: 61.73913043478261, current_count: 230 +2024-07-30 13:50:59,951 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:50:59,951 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:50:59,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:50:59,952 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:50:59,952 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:00,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:00,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:00,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:00,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,452 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.499450445175171 s; generated tokens: 19 tokens; generate speed: 12.671309052684535 tokens/s +2024-07-30 13:51:01,457 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:01,457 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[231/2067], cost time 1.5107s, every example cost time is 1.5107, generate speed: 12.5773 tokens/s, avg speed: 10.1567 tokens/s, remaining time: 0:41:30 +pred is: + ['A theory of gravity'] + label is: + ['gravity'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:51:01,539 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:01,539 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:01,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:01,540 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:01,540 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:02,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:02,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:03,073 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532696008682251 s; generated tokens: 20 tokens; generate speed: 13.048901991462207 tokens/s +2024-07-30 13:51:03,078 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:03,078 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[232/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9523 tokens/s, avg speed: 10.1704 tokens/s, remaining time: 0:41:30 +pred is: + ['The idea that humans\' "pity" had interfered with the natural "ruthless'] + label is: + ['eugenics'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:03,161 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:03,161 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 106, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:03,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:03,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:03,162 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:04,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,691 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5287094116210938 s; generated tokens: 20 tokens; generate speed: 13.082931162693203 tokens/s +2024-07-30 13:51:04,696 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:04,696 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[233/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9856 tokens/s, avg speed: 10.1841 tokens/s, remaining time: 0:41:31 +pred is: + ['Queen Bees'] + label is: + ['women'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:04,778 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:04,778 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 117, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:04,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:04,779 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:04,779 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:05,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:05,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:06,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:06,307 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527773380279541 s; generated tokens: 20 tokens; generate speed: 13.090946771399135 tokens/s +2024-07-30 13:51:06,312 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:06,313 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[234/2067], cost time 1.5393s, every example cost time is 1.5393, generate speed: 12.9925 tokens/s, avg speed: 10.1977 tokens/s, remaining time: 0:41:31 +pred is: + ['1'] + label is: + ['post-World War I'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:06,394 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:06,395 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 94, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:06,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:06,395 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:06,396 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:07,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,801 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4052281379699707 s; generated tokens: 16 tokens; generate speed: 11.386051536879997 tokens/s +2024-07-30 13:51:07,806 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:07,806 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[235/2067], cost time 1.4165s, every example cost time is 1.4165, generate speed: 11.2956 tokens/s, avg speed: 10.2026 tokens/s, remaining time: 0:41:30 +pred is: + ['Orthodox Christianity'] + label is: + ['Orthodox Christian'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 13:51:07,889 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:07,889 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 85, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:07,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:07,890 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:07,890 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:08,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:08,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:08,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:08,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:08,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:08,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,144 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2540159225463867 s; generated tokens: 11 tokens; generate speed: 8.771818445226403 tokens/s +2024-07-30 13:51:09,149 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:09,149 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[236/2067], cost time 1.2651s, every example cost time is 1.2651, generate speed: 8.6950 tokens/s, avg speed: 10.1967 tokens/s, remaining time: 0:41:28 +pred is: + ['A Machine to End War'] + label is: + ['"A Machine to End War"'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +2024-07-30 13:51:09,232 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:09,232 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 102, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:09,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:09,232 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:09,233 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:10,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:10,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:10,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:10,240 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0073966979980469 s; generated tokens: 3 tokens; generate speed: 2.9779728342983076 tokens/s +2024-07-30 13:51:10,245 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:10,245 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[237/2067], cost time 1.0185s, every example cost time is 1.0185, generate speed: 2.9455 tokens/s, avg speed: 10.1737 tokens/s, remaining time: 0:41:24 +pred is: + ['books'] + label is: + ['books and articles'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:51:10,332 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:10,333 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 115, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:10,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:10,333 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:10,334 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:11,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,769 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.435317039489746 s; generated tokens: 17 tokens; generate speed: 11.844073143619534 tokens/s +2024-07-30 13:51:11,774 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:11,774 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[238/2067], cost time 1.4469s, every example cost time is 1.4469, generate speed: 11.7490 tokens/s, avg speed: 10.1808 tokens/s, remaining time: 0:41:23 +pred is: + ['1'] + label is: + ['the web'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:11,856 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:11,856 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 94, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:11,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:11,857 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:11,857 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:12,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:12,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:13,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:13,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:13,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:13,386 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5280280113220215 s; generated tokens: 20 tokens; generate speed: 13.08876529213386 tokens/s +2024-07-30 13:51:13,390 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:13,391 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[239/2067], cost time 1.5393s, every example cost time is 1.5393, generate speed: 12.9929 tokens/s, avg speed: 10.1941 tokens/s, remaining time: 0:41:23 +pred is: + ['1'] + label is: + ['science fiction'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:13,472 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:13,473 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 111, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:13,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:13,473 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:13,474 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:14,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:14,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:15,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5278592109680176 s; generated tokens: 20 tokens; generate speed: 13.09021136006926 tokens/s +2024-07-30 13:51:15,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:15,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[240/2067], cost time 1.5391s, every example cost time is 1.5391, generate speed: 12.9945 tokens/s, avg speed: 10.2073 tokens/s, remaining time: 0:41:23 +pred is: + ['Time'] + label is: + ['Time magazine'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 70.14239215556925, Em score: 59.166666666666664, current_count: 240 +2024-07-30 13:51:15,143 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:15,143 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 140, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:15,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:15,144 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:15,144 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:16,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,673 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5287432670593262 s; generated tokens: 20 tokens; generate speed: 13.08264142904242 tokens/s +2024-07-30 13:51:16,677 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:16,678 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[241/2067], cost time 1.5400s, every example cost time is 1.5400, generate speed: 12.9868 tokens/s, avg speed: 10.2204 tokens/s, remaining time: 0:41:23 +pred is: + ['A'] + label is: + ['Computational complexity theory'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:16,760 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:16,760 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:16,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:16,761 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:16,761 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:17,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:17,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:18,321 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.559727430343628 s; generated tokens: 20 tokens; generate speed: 12.822753265032816 tokens/s +2024-07-30 13:51:18,326 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:18,326 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[242/2067], cost time 1.5710s, every example cost time is 1.5710, generate speed: 12.7307 tokens/s, avg speed: 10.2323 tokens/s, remaining time: 0:41:23 +pred is: + ['A'] + label is: + ['if its solution requires significant resources'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:18,409 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:18,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:18,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:18,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:18,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:19,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:19,957 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5454554557800293 s; generated tokens: 20 tokens; generate speed: 12.941168847798016 tokens/s +2024-07-30 13:51:19,962 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:19,962 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[243/2067], cost time 1.5575s, every example cost time is 1.5575, generate speed: 12.8413 tokens/s, avg speed: 10.2446 tokens/s, remaining time: 0:41:23 +pred is: + ['1'] + label is: + ['analysis of algorithms and computability theory'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:20,044 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:20,044 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:20,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:20,045 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:20,045 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:20,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,597 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5511200428009033 s; generated tokens: 20 tokens; generate speed: 12.89390856163873 tokens/s +2024-07-30 13:51:21,601 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:21,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[244/2067], cost time 1.5624s, every example cost time is 1.5624, generate speed: 12.8006 tokens/s, avg speed: 10.2566 tokens/s, remaining time: 0:41:23 +pred is: + ['1'] + label is: + ['problem instance'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:21,684 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:21,684 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:21,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:21,685 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:21,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:22,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:22,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:23,236 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5511183738708496 s; generated tokens: 20 tokens; generate speed: 12.893922434874886 tokens/s +2024-07-30 13:51:23,241 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:23,241 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[245/2067], cost time 1.5623s, every example cost time is 1.5623, generate speed: 12.8014 tokens/s, avg speed: 10.2685 tokens/s, remaining time: 0:41:24 +pred is: + ['2000'] + label is: + ['2000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:51:23,323 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:23,324 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:23,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:23,324 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:23,324 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:24,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,853 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5287103652954102 s; generated tokens: 20 tokens; generate speed: 13.082923001006257 tokens/s +2024-07-30 13:51:24,858 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:24,858 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[246/2067], cost time 1.5398s, every example cost time is 1.5398, generate speed: 12.9888 tokens/s, avg speed: 10.2810 tokens/s, remaining time: 0:41:24 +pred is: + ['1'] + label is: + ['problem instance'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:24,940 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:24,940 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:24,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:24,940 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:24,941 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:25,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:25,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:25,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,504 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.562856674194336 s; generated tokens: 20 tokens; generate speed: 12.797078791828525 tokens/s +2024-07-30 13:51:26,508 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:26,509 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[247/2067], cost time 1.5739s, every example cost time is 1.5739, generate speed: 12.7070 tokens/s, avg speed: 10.2923 tokens/s, remaining time: 0:41:24 +pred is: + ['Decision problems'] + label is: + ['Decision problems'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:51:26,590 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:26,591 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 127, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:26,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:26,591 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:26,591 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:27,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:27,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:28,146 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5548248291015625 s; generated tokens: 20 tokens; generate speed: 12.863185373465361 tokens/s +2024-07-30 13:51:28,151 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:28,152 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[248/2067], cost time 1.5660s, every example cost time is 1.5660, generate speed: 12.7712 tokens/s, avg speed: 10.3038 tokens/s, remaining time: 0:41:24 +pred is: + ['1'] + label is: + ['arbitrary graph'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:28,233 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:28,234 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 109, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:28,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:28,234 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:28,234 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:29,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,803 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.568490743637085 s; generated tokens: 20 tokens; generate speed: 12.751111271223142 tokens/s +2024-07-30 13:51:29,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:29,808 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[249/2067], cost time 1.5797s, every example cost time is 1.5797, generate speed: 12.6603 tokens/s, avg speed: 10.3147 tokens/s, remaining time: 0:41:24 +pred is: + ['A'] + label is: + ['a computational problem'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:51:29,890 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:29,891 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:29,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:29,891 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:29,892 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:30,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:30,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:30,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:30,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:30,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:30,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,453 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5607640743255615 s; generated tokens: 20 tokens; generate speed: 12.814236519790741 tokens/s +2024-07-30 13:51:31,457 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:31,458 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[250/2067], cost time 1.5721s, every example cost time is 1.5721, generate speed: 12.7222 tokens/s, avg speed: 10.3258 tokens/s, remaining time: 0:41:24 +pred is: + ['1'] + label is: + ['decision problems'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 68.27002980267983, Em score: 57.6, current_count: 250 +2024-07-30 13:51:31,598 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:31,598 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:31,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:31,599 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:31,599 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:32,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:32,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:33,127 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5285098552703857 s; generated tokens: 20 tokens; generate speed: 13.084639219720373 tokens/s +2024-07-30 13:51:33,132 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:33,132 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[251/2067], cost time 1.5397s, every example cost time is 1.5397, generate speed: 12.9895 tokens/s, avg speed: 10.3377 tokens/s, remaining time: 0:41:24 +pred is: + ['1'] + label is: + ['how much time the best algorithm requires to solve the problem'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:33,215 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:33,215 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:33,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:33,216 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:33,216 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:34,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,747 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530395269393921 s; generated tokens: 20 tokens; generate speed: 13.06851922504998 tokens/s +2024-07-30 13:51:34,751 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:34,752 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[252/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9744 tokens/s, avg speed: 10.3495 tokens/s, remaining time: 0:41:24 +pred is: + ["Cobham's"] + label is: + ["Cobham's thesis"] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:51:34,834 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:34,835 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:34,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:34,835 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:34,835 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:35,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:35,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:36,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:36,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:36,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:36,394 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5585806369781494 s; generated tokens: 20 tokens; generate speed: 12.832188162414846 tokens/s +2024-07-30 13:51:36,399 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:36,399 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[253/2067], cost time 1.5698s, every example cost time is 1.5698, generate speed: 12.7408 tokens/s, avg speed: 10.3604 tokens/s, remaining time: 0:41:24 +pred is: + ['Turing machine'] + label is: + ['A Turing machine'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:51:36,483 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:36,483 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:36,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:36,484 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:36,484 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:37,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:37,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:38,041 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5571208000183105 s; generated tokens: 20 tokens; generate speed: 12.84421863722122 tokens/s +2024-07-30 13:51:38,046 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:38,046 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[254/2067], cost time 1.5683s, every example cost time is 1.5683, generate speed: 12.7528 tokens/s, avg speed: 10.3711 tokens/s, remaining time: 0:41:24 +pred is: + ['A'] + label is: + ['A deterministic Turing machine'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:51:38,128 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:38,129 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 122, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:38,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:38,129 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:38,130 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:39,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,668 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5383026599884033 s; generated tokens: 20 tokens; generate speed: 13.001342661756023 tokens/s +2024-07-30 13:51:39,673 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:39,673 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[255/2067], cost time 1.5496s, every example cost time is 1.5496, generate speed: 12.9068 tokens/s, avg speed: 10.3824 tokens/s, remaining time: 0:41:24 +pred is: + ['complexity classes'] + label is: + ['complexity classes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:51:39,755 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:39,755 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:39,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:39,756 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:39,756 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:40,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:40,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:41,307 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5509216785430908 s; generated tokens: 20 tokens; generate speed: 12.895557703976165 tokens/s +2024-07-30 13:51:41,312 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:41,312 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[256/2067], cost time 1.5622s, every example cost time is 1.5622, generate speed: 12.8027 tokens/s, avg speed: 10.3931 tokens/s, remaining time: 0:41:24 +pred is: + ['1'] + label is: + ['random access machines'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:41,394 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:41,395 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:41,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:41,395 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:41,396 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:42,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:42,930 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338821411132812 s; generated tokens: 20 tokens; generate speed: 13.03881143402852 tokens/s +2024-07-30 13:51:42,934 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:42,935 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[257/2067], cost time 1.5450s, every example cost time is 1.5450, generate speed: 12.9451 tokens/s, avg speed: 10.4043 tokens/s, remaining time: 0:41:24 +pred is: + ['A'] + label is: + ['non-deterministic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:43,017 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:43,017 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:43,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:43,018 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:43,018 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:43,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:43,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,556 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5376458168029785 s; generated tokens: 20 tokens; generate speed: 13.00689650467318 tokens/s +2024-07-30 13:51:44,560 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:44,561 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[258/2067], cost time 1.5488s, every example cost time is 1.5488, generate speed: 12.9130 tokens/s, avg speed: 10.4153 tokens/s, remaining time: 0:41:24 +pred is: + ['D'] + label is: + ['state transitions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:44,643 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:44,643 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 117, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:44,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:44,644 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:44,644 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:45,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:45,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:46,058 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4131009578704834 s; generated tokens: 16 tokens; generate speed: 11.322616343075515 tokens/s +2024-07-30 13:51:46,062 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:46,063 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[259/2067], cost time 1.4242s, every example cost time is 1.4242, generate speed: 11.2340 tokens/s, avg speed: 10.4186 tokens/s, remaining time: 0:41:23 +pred is: + ['A'] + label is: + ['complexity resources'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:46,145 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:46,145 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 103, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:46,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:46,146 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:46,146 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:47,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,278 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1317098140716553 s; generated tokens: 7 tokens; generate speed: 6.185331180274441 tokens/s +2024-07-30 13:51:47,282 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:47,283 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[260/2067], cost time 1.1427s, every example cost time is 1.1427, generate speed: 6.1256 tokens/s, avg speed: 10.4048 tokens/s, remaining time: 0:41:20 +pred is: + ['Best, worst, average'] + label is: + ['best, worst and average'] +The F1/Em of this example is: {'F1': 53.333333333333336, 'Em': 0.0} +F1 score: 66.90707993847418, Em score: 55.76923076923077, current_count: 260 +2024-07-30 13:51:47,429 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:47,429 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:47,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:47,430 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:47,430 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:48,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,501 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0708229541778564 s; generated tokens: 5 tokens; generate speed: 4.6693059580879455 tokens/s +2024-07-30 13:51:48,506 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:48,506 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[261/2067], cost time 1.0821s, every example cost time is 1.0821, generate speed: 4.6205 tokens/s, avg speed: 10.3873 tokens/s, remaining time: 0:41:16 +pred is: + ['The worst-case'] + label is: + ['deterministic sorting algorithm quicksort'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 13:51:48,588 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:48,588 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:48,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:48,589 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:48,589 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:49,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:49,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:50,141 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5515353679656982 s; generated tokens: 20 tokens; generate speed: 12.89045703561568 tokens/s +2024-07-30 13:51:50,146 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:50,146 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[262/2067], cost time 1.5627s, every example cost time is 1.5627, generate speed: 12.7985 tokens/s, avg speed: 10.3978 tokens/s, remaining time: 0:41:16 +pred is: + ['The complexity of an algorithm '] + label is: + ['the most efficient algorithm'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:51:50,229 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:50,229 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 121, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:50,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:50,229 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:50,230 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:51,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,304 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0745162963867188 s; generated tokens: 5 tokens; generate speed: 4.653256555357536 tokens/s +2024-07-30 13:51:51,309 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:51,309 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[263/2067], cost time 1.0855s, every example cost time is 1.0855, generate speed: 4.6060 tokens/s, avg speed: 10.3804 tokens/s, remaining time: 0:41:13 +pred is: + ['Big O notation'] + label is: + ['big O notation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:51:51,391 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:51,392 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 79, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:51,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:51,392 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:51,392 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:52,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:52,922 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291922092437744 s; generated tokens: 20 tokens; generate speed: 13.078800610611614 tokens/s +2024-07-30 13:51:52,927 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:52,927 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[264/2067], cost time 1.5404s, every example cost time is 1.5404, generate speed: 12.9833 tokens/s, avg speed: 10.3915 tokens/s, remaining time: 0:41:13 +pred is: + ['A'] + label is: + ['complexity classes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:53,009 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:53,010 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:53,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:53,010 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:53,011 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:53,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:53,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,544 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5328896045684814 s; generated tokens: 20 tokens; generate speed: 13.04725398384454 tokens/s +2024-07-30 13:51:54,548 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:54,549 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[265/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9524 tokens/s, avg speed: 10.4023 tokens/s, remaining time: 0:41:12 +pred is: + ['1'] + label is: + ['chosen machine model'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:54,631 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:54,631 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 86, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:54,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:54,632 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:54,632 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:55,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:55,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:56,165 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5326800346374512 s; generated tokens: 20 tokens; generate speed: 13.049037990979581 tokens/s +2024-07-30 13:51:56,169 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:56,170 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[266/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9544 tokens/s, avg speed: 10.4131 tokens/s, remaining time: 0:41:12 +pred is: + ['1'] + label is: + ['time or space'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:56,253 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:56,253 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:56,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:56,254 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:56,254 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:57,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,784 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5295422077178955 s; generated tokens: 20 tokens; generate speed: 13.07580784569545 tokens/s +2024-07-30 13:51:57,788 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:57,789 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[267/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9811 tokens/s, avg speed: 10.4239 tokens/s, remaining time: 0:41:12 +pred is: + ['BPP, ZPP and RP'] + label is: + ['BPP, ZPP and RP'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:51:57,871 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:57,871 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:57,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:57,872 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:57,872 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:51:58,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:58,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:58,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:58,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:58,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:58,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,407 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5349369049072266 s; generated tokens: 20 tokens; generate speed: 13.029851543773276 tokens/s +2024-07-30 13:51:59,412 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:51:59,412 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[268/2067], cost time 1.5461s, every example cost time is 1.5461, generate speed: 12.9360 tokens/s, avg speed: 10.4344 tokens/s, remaining time: 0:41:12 +pred is: + ['1'] + label is: + ['computation time'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:51:59,501 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:51:59,501 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 103, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:51:59,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:51:59,502 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:51:59,502 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:00,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:00,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:01,034 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5315818786621094 s; generated tokens: 20 tokens; generate speed: 13.058394251485074 tokens/s +2024-07-30 13:52:01,039 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:01,039 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[269/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9612 tokens/s, avg speed: 10.4450 tokens/s, remaining time: 0:41:12 +pred is: + ['1'] + label is: + ['time and space hierarchy theorems'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:01,122 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:01,122 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:01,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:01,123 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:01,123 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:02,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,657 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337140560150146 s; generated tokens: 20 tokens; generate speed: 13.04024040306781 tokens/s +2024-07-30 13:52:02,662 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:02,662 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[270/2067], cost time 1.5452s, every example cost time is 1.5452, generate speed: 12.9434 tokens/s, avg speed: 10.4554 tokens/s, remaining time: 0:41:11 +pred is: + ['reduction'] + label is: + ['reduction'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 65.7068177185307, Em score: 54.81481481481482, current_count: 270 +2024-07-30 13:52:02,808 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:02,809 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:02,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:02,809 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:02,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:03,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:03,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:03,789 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9793963432312012 s; generated tokens: 2 tokens; generate speed: 2.0420741958272455 tokens/s +2024-07-30 13:52:03,794 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:03,794 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[271/2067], cost time 0.9914s, every example cost time is 0.9914, generate speed: 2.0173 tokens/s, avg speed: 10.4329 tokens/s, remaining time: 0:41:07 +pred is: + ['A'] + label is: + ['polynomial-time reduction'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:03,876 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:03,876 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:03,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:03,877 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:03,877 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:04,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:04,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:04,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:04,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:04,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:04,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,411 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342226028442383 s; generated tokens: 20 tokens; generate speed: 13.035917971044581 tokens/s +2024-07-30 13:52:05,417 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:05,417 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[272/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9346 tokens/s, avg speed: 10.4433 tokens/s, remaining time: 0:41:07 +pred is: + ['1'] + label is: + ['the type of reduction being used'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:05,500 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:05,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:05,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:05,501 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:05,501 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:06,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:06,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:07,039 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.538055658340454 s; generated tokens: 20 tokens; generate speed: 13.0034305920891 tokens/s +2024-07-30 13:52:07,044 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:07,044 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[273/2067], cost time 1.5493s, every example cost time is 1.5493, generate speed: 12.9088 tokens/s, avg speed: 10.4534 tokens/s, remaining time: 0:41:07 +pred is: + ['NP-complete'] + label is: + ['NP-complete'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:07,126 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:07,126 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:07,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:07,127 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:07,127 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:08,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:08,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:08,106 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9784696102142334 s; generated tokens: 2 tokens; generate speed: 2.0440082953236587 tokens/s +2024-07-30 13:52:08,110 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:08,111 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[274/2067], cost time 0.9898s, every example cost time is 0.9898, generate speed: 2.0207 tokens/s, avg speed: 10.4313 tokens/s, remaining time: 0:41:03 +pred is: + ['P'] + label is: + ['P'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:08,193 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:08,193 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:08,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:08,194 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:08,194 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:09,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,740 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5457487106323242 s; generated tokens: 20 tokens; generate speed: 12.938713687698007 tokens/s +2024-07-30 13:52:09,745 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:09,745 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[275/2067], cost time 1.5573s, every example cost time is 1.5573, generate speed: 12.8426 tokens/s, avg speed: 10.4412 tokens/s, remaining time: 0:41:03 +pred is: + ['1'] + label is: + ['more efficient solutions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:09,828 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:09,828 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:09,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:09,828 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:09,829 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:10,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:10,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:11,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:11,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:11,360 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5312976837158203 s; generated tokens: 20 tokens; generate speed: 13.060817770891124 tokens/s +2024-07-30 13:52:11,365 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:11,366 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[276/2067], cost time 1.5428s, every example cost time is 1.5428, generate speed: 12.9631 tokens/s, avg speed: 10.4514 tokens/s, remaining time: 0:41:03 +pred is: + ['1'] + label is: + ['Ladner'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:11,447 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:11,448 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:11,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:11,448 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:11,449 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:12,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:12,980 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311670303344727 s; generated tokens: 20 tokens; generate speed: 13.061932241077017 tokens/s +2024-07-30 13:52:12,985 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:12,985 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[277/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9660 tokens/s, avg speed: 10.4616 tokens/s, remaining time: 0:41:02 +pred is: + ['graph isomorphism problem'] + label is: + ['The graph isomorphism problem'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:52:13,068 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:13,068 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:13,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:13,069 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:13,069 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:14,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,604 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534973382949829 s; generated tokens: 20 tokens; generate speed: 13.029541894443197 tokens/s +2024-07-30 13:52:14,609 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:14,609 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[278/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9345 tokens/s, avg speed: 10.4716 tokens/s, remaining time: 0:41:02 +pred is: + ['1'] + label is: + ['The integer factorization problem'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:14,691 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:14,691 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:14,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:14,692 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:14,692 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:15,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:15,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:16,228 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535186767578125 s; generated tokens: 20 tokens; generate speed: 13.027730841864626 tokens/s +2024-07-30 13:52:16,232 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:16,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[279/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9335 tokens/s, avg speed: 10.4815 tokens/s, remaining time: 0:41:02 +pred is: + ['P ≠ NP'] + label is: + ['suspected to be unequal'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 13:52:16,315 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:16,315 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 124, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:16,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:16,316 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:16,316 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:17,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:17,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:17,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:17,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:17,363 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0466992855072021 s; generated tokens: 4 tokens; generate speed: 3.8215369546772053 tokens/s +2024-07-30 13:52:17,368 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:17,368 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[280/2067], cost time 1.0578s, every example cost time is 1.0578, generate speed: 3.7814 tokens/s, avg speed: 10.4631 tokens/s, remaining time: 0:40:58 +pred is: + ['co-NP'] + label is: + ['co-NP'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.78871708572603, Em score: 53.92857142857143, current_count: 280 +2024-07-30 13:52:17,514 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:17,514 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 114, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:17,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:17,515 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:17,515 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:18,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:18,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:19,070 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5542006492614746 s; generated tokens: 20 tokens; generate speed: 12.868351335140417 tokens/s +2024-07-30 13:52:19,075 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:19,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[281/2067], cost time 1.5662s, every example cost time is 1.5662, generate speed: 12.7694 tokens/s, avg speed: 10.4725 tokens/s, remaining time: 0:40:58 +pred is: + ['L'] + label is: + ['L'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:19,157 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:19,157 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 350, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:19,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:19,158 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:19,158 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:20,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,696 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5379960536956787 s; generated tokens: 20 tokens; generate speed: 13.003934536725003 tokens/s +2024-07-30 13:52:20,701 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:20,701 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[282/2067], cost time 1.5492s, every example cost time is 1.5492, generate speed: 12.9100 tokens/s, avg speed: 10.4822 tokens/s, remaining time: 0:40:58 +pred is: + ['intractable'] + label is: + ['intractable problems'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:52:20,810 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:20,810 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:20,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:20,811 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:20,811 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:21,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:21,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:22,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:22,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:22,343 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5323460102081299 s; generated tokens: 20 tokens; generate speed: 13.051882451329327 tokens/s +2024-07-30 13:52:22,348 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:22,348 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[283/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9546 tokens/s, avg speed: 10.4920 tokens/s, remaining time: 0:40:57 +pred is: + ['Presburger'] + label is: + ['Presburger arithmetic'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:52:22,431 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:22,431 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 117, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:22,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:22,432 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:22,432 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:23,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:23,960 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5273947715759277 s; generated tokens: 20 tokens; generate speed: 13.094191738894391 tokens/s +2024-07-30 13:52:23,964 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:23,965 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[284/2067], cost time 1.5386s, every example cost time is 1.5386, generate speed: 12.9992 tokens/s, avg speed: 10.5018 tokens/s, remaining time: 0:40:57 +pred is: + ['A'] + label is: + ['foundations were laid out'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:24,047 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:24,047 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:24,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:24,048 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:24,048 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:24,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,599 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.550558090209961 s; generated tokens: 20 tokens; generate speed: 12.89858156639059 tokens/s +2024-07-30 13:52:25,603 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:25,604 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[285/2067], cost time 1.5617s, every example cost time is 1.5617, generate speed: 12.8064 tokens/s, avg speed: 10.5110 tokens/s, remaining time: 0:40:57 +pred is: + ['1'] + label is: + ['On the Computational Complexity of Algorithms'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:25,686 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:25,686 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:25,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:25,687 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:25,687 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:26,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:26,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:27,216 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5290250778198242 s; generated tokens: 20 tokens; generate speed: 13.080230200355642 tokens/s +2024-07-30 13:52:27,221 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:27,221 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[286/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9857 tokens/s, avg speed: 10.5207 tokens/s, remaining time: 0:40:57 +pred is: + ['John Myhill'] + label is: + ['John Myhill'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:27,304 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:27,304 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 110, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:27,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:27,305 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:27,305 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:28,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,836 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311665534973145 s; generated tokens: 20 tokens; generate speed: 13.061936308834792 tokens/s +2024-07-30 13:52:28,841 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:28,841 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[287/2067], cost time 1.5423s, every example cost time is 1.5423, generate speed: 12.9677 tokens/s, avg speed: 10.5302 tokens/s, remaining time: 0:40:56 +pred is: + ['1'] + label is: + ['input encoding'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:28,948 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:28,948 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:28,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:28,949 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:28,949 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:29,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:29,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:29,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,505 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5563371181488037 s; generated tokens: 20 tokens; generate speed: 12.850686247070392 tokens/s +2024-07-30 13:52:30,510 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:30,510 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[288/2067], cost time 1.5679s, every example cost time is 1.5679, generate speed: 12.7556 tokens/s, avg speed: 10.5390 tokens/s, remaining time: 0:40:56 +pred is: + ['1'] + label is: + ['Manuel Blum'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:30,592 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:30,593 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:30,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:30,593 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:30,593 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:31,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:31,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:31,573 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9794576168060303 s; generated tokens: 2 tokens; generate speed: 2.0419464463627484 tokens/s +2024-07-30 13:52:31,578 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:31,578 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[289/2067], cost time 0.9905s, every example cost time is 0.9905, generate speed: 2.0191 tokens/s, avg speed: 10.5178 tokens/s, remaining time: 0:40:52 +pred is: + ['curriculum'] + label is: + ['the curriculum.'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 13:52:31,661 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:31,662 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 87, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:31,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:31,662 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:31,662 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:32,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,732 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.069164514541626 s; generated tokens: 5 tokens; generate speed: 4.6765487742956084 tokens/s +2024-07-30 13:52:32,736 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:32,737 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[290/2067], cost time 1.0804s, every example cost time is 1.0804, generate speed: 4.6280 tokens/s, avg speed: 10.5019 tokens/s, remaining time: 0:40:49 +pred is: + ['Cultural factors'] + label is: + ['cultures'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.72703718621824, Em score: 52.758620689655174, current_count: 290 +2024-07-30 13:52:32,908 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:32,908 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 97, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:32,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:32,909 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:32,909 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:33,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:33,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:33,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:33,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:33,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,437 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5280027389526367 s; generated tokens: 20 tokens; generate speed: 13.088981773494018 tokens/s +2024-07-30 13:52:34,442 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:34,442 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[291/2067], cost time 1.5396s, every example cost time is 1.5396, generate speed: 12.9908 tokens/s, avg speed: 10.5114 tokens/s, remaining time: 0:40:49 +pred is: + ['A family member'] + label is: + ['family member'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:52:34,524 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:34,524 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 88, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:34,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:34,525 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:34,525 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:35,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,595 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0695116519927979 s; generated tokens: 5 tokens; generate speed: 4.6750308803869585 tokens/s +2024-07-30 13:52:35,600 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:35,600 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[292/2067], cost time 1.0805s, every example cost time is 1.0805, generate speed: 4.6275 tokens/s, avg speed: 10.4956 tokens/s, remaining time: 0:40:45 +pred is: + ['Spiritual leader'] + label is: + ['spiritual'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:52:35,682 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:35,682 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 110, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:35,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:35,683 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:35,683 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:36,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:36,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:37,233 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.550008773803711 s; generated tokens: 20 tokens; generate speed: 12.903152767916362 tokens/s +2024-07-30 13:52:37,238 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:37,238 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[293/2067], cost time 1.5611s, every example cost time is 1.5611, generate speed: 12.8111 tokens/s, avg speed: 10.5046 tokens/s, remaining time: 0:40:45 +pred is: + ['homeschooling'] + label is: + ['homeschooling'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:37,320 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:37,321 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 105, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:37,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:37,321 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:37,321 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:38,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:38,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:38,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:38,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:38,387 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.06559419631958 s; generated tokens: 4 tokens; generate speed: 3.7537741982974997 tokens/s +2024-07-30 13:52:38,392 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:38,392 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[294/2067], cost time 1.0766s, every example cost time is 1.0766, generate speed: 3.7154 tokens/s, avg speed: 10.4865 tokens/s, remaining time: 0:40:42 +pred is: + ['school functions'] + label is: + ['school functions'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:38,474 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:38,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 106, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:38,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:38,475 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:38,475 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:39,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:39,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:40,020 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.544661283493042 s; generated tokens: 20 tokens; generate speed: 12.947822421477873 tokens/s +2024-07-30 13:52:40,025 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:40,025 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[295/2067], cost time 1.5558s, every example cost time is 1.5558, generate speed: 12.8553 tokens/s, avg speed: 10.4956 tokens/s, remaining time: 0:40:42 +pred is: + ["Teacher's colleges"] + label is: + ["teacher's colleges"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:40,107 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:40,107 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:40,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:40,108 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:40,108 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:41,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2793457508087158 s; generated tokens: 11 tokens; generate speed: 8.598144788495638 tokens/s +2024-07-30 13:52:41,392 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:41,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[296/2067], cost time 1.2904s, every example cost time is 1.2904, generate speed: 8.5246 tokens/s, avg speed: 10.4893 tokens/s, remaining time: 0:40:40 +pred is: + ['Teachers'] + label is: + ['members'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:41,475 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:41,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 88, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:41,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:41,476 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:41,476 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:42,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,546 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.06974196434021 s; generated tokens: 5 tokens; generate speed: 4.67402435977528 tokens/s +2024-07-30 13:52:42,550 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:42,551 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[297/2067], cost time 1.0807s, every example cost time is 1.0807, generate speed: 4.6266 tokens/s, avg speed: 10.4739 tokens/s, remaining time: 0:40:37 +pred is: + ['In a park'] + label is: + ['outdoors'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:42,632 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:42,633 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:42,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:42,633 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:42,634 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:43,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:43,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:44,165 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308785438537598 s; generated tokens: 20 tokens; generate speed: 13.064393697525452 tokens/s +2024-07-30 13:52:44,169 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:44,170 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[298/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9698 tokens/s, avg speed: 10.4832 tokens/s, remaining time: 0:40:36 +pred is: + ['Informal'] + label is: + ['informal'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:44,252 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:44,253 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 102, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:44,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:44,253 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:44,253 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:45,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,787 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5329711437225342 s; generated tokens: 20 tokens; generate speed: 13.046559996839688 tokens/s +2024-07-30 13:52:45,791 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:45,792 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[299/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9521 tokens/s, avg speed: 10.4925 tokens/s, remaining time: 0:40:36 +pred is: + ['1'] + label is: + ['skill'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:45,873 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:45,874 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:45,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:45,874 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:45,875 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:46,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:46,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:46,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:46,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:46,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:46,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0712122917175293 s; generated tokens: 5 tokens; generate speed: 4.667608875158859 tokens/s +2024-07-30 13:52:46,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:46,951 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[300/2067], cost time 1.0823s, every example cost time is 1.0823, generate speed: 4.6200 tokens/s, avg speed: 10.4771 tokens/s, remaining time: 0:40:33 +pred is: + ['Educational levels'] + label is: + ['particular skills'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +F1 score: 63.463913724455416, Em score: 52.333333333333336, current_count: 300 +2024-07-30 13:52:47,101 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:47,101 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:47,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:47,102 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:47,102 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:48,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,450 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.347447395324707 s; generated tokens: 14 tokens; generate speed: 10.390016002536624 tokens/s +2024-07-30 13:52:48,454 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:48,455 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[301/2067], cost time 1.3587s, every example cost time is 1.3587, generate speed: 10.3037 tokens/s, avg speed: 10.4765 tokens/s, remaining time: 0:40:31 +pred is: + ['The relationship between teachers and children is closer in primary school.'] + label is: + ['the relationship between teachers and children'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 13:52:48,537 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:48,538 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:48,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:48,538 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:48,538 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:49,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:49,952 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4138495922088623 s; generated tokens: 16 tokens; generate speed: 11.316621009879235 tokens/s +2024-07-30 13:52:49,957 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:49,957 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[302/2067], cost time 1.4251s, every example cost time is 1.4251, generate speed: 11.2271 tokens/s, avg speed: 10.4791 tokens/s, remaining time: 0:40:30 +pred is: + ['Alternative approaches for primary school are available that are different than the norm.'] + label is: + ['alternative'] +The F1/Em of this example is: {'F1': 7.4074074074074066, 'Em': 0.0} +2024-07-30 13:52:50,045 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:50,046 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 123, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:50,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:50,046 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:50,046 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:50,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,551 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.504251480102539 s; generated tokens: 19 tokens; generate speed: 12.630866747563275 tokens/s +2024-07-30 13:52:51,556 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:51,556 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[303/2067], cost time 1.5160s, every example cost time is 1.5160, generate speed: 12.5327 tokens/s, avg speed: 10.4866 tokens/s, remaining time: 0:40:29 +pred is: + ['Co-teaching'] + label is: + ['Co-teaching'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:51,638 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:51,638 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 94, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:51,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:51,639 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:51,639 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:52,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:52,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:53,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5270600318908691 s; generated tokens: 20 tokens; generate speed: 13.09706205540274 tokens/s +2024-07-30 13:52:53,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:53,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[304/2067], cost time 1.5382s, every example cost time is 1.5382, generate speed: 13.0022 tokens/s, avg speed: 10.4958 tokens/s, remaining time: 0:40:29 +pred is: + ['1'] + label is: + ['corporal punishment'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:53,254 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:53,254 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:53,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:53,255 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:53,255 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:54,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,763 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5075316429138184 s; generated tokens: 19 tokens; generate speed: 12.603383875429659 tokens/s +2024-07-30 13:52:54,767 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:54,768 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[305/2067], cost time 1.5187s, every example cost time is 1.5187, generate speed: 12.5107 tokens/s, avg speed: 10.5031 tokens/s, remaining time: 0:40:28 +pred is: + ['It was one of the most common forms of school discipline throughout much of the world.'] + label is: + ['one of the most common'] +The F1/Em of this example is: {'F1': 43.90243902439025, 'Em': 0.0} +2024-07-30 13:52:54,851 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:54,851 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:54,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:54,852 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:54,852 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:55,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:55,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:55,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:55,860 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.007295846939087 s; generated tokens: 3 tokens; generate speed: 2.978270990708667 tokens/s +2024-07-30 13:52:55,864 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:55,864 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[306/2067], cost time 1.0182s, every example cost time is 1.0182, generate speed: 2.9462 tokens/s, avg speed: 10.4848 tokens/s, remaining time: 0:40:25 +pred is: + ['30'] + label is: + ['30'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:55,945 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:55,946 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 83, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:55,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:55,946 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:55,947 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:56,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:56,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:56,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:56,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,477 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5301837921142578 s; generated tokens: 20 tokens; generate speed: 13.070325344621487 tokens/s +2024-07-30 13:52:57,482 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:57,482 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[307/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9766 tokens/s, avg speed: 10.4939 tokens/s, remaining time: 0:40:25 +pred is: + ['1'] + label is: + ['caning'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:52:57,563 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:57,564 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:57,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:57,565 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:57,565 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:58,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:58,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:58,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:58,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:58,604 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0391771793365479 s; generated tokens: 4 tokens; generate speed: 3.849199231408988 tokens/s +2024-07-30 13:52:58,609 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:52:58,609 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[308/2067], cost time 1.0504s, every example cost time is 1.0504, generate speed: 3.8081 tokens/s, avg speed: 10.4773 tokens/s, remaining time: 0:40:21 +pred is: + ['Detention'] + label is: + ['detention'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:52:58,697 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:52:58,698 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:52:58,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:58,698 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:52:58,699 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:52:59,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:52:59,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:00,230 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311272144317627 s; generated tokens: 20 tokens; generate speed: 13.06227190757789 tokens/s +2024-07-30 13:53:00,235 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:00,235 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[309/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9650 tokens/s, avg speed: 10.4864 tokens/s, remaining time: 0:40:21 +pred is: + ['1'] + label is: + ['assertive'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:00,317 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:00,317 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:00,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:00,318 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:00,318 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:01,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:01,847 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5289483070373535 s; generated tokens: 20 tokens; generate speed: 13.080886978287738 tokens/s +2024-07-30 13:53:01,852 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:01,852 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[310/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9864 tokens/s, avg speed: 10.4954 tokens/s, remaining time: 0:40:20 +pred is: + ['1'] + label is: + ['some teachers and parents'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.765002033661574, Em score: 51.61290322580645, current_count: 310 +2024-07-30 13:53:02,006 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:02,006 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:02,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:02,007 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:02,007 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:02,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:02,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,541 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5339791774749756 s; generated tokens: 20 tokens; generate speed: 13.037986625686298 tokens/s +2024-07-30 13:53:03,546 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:03,546 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[311/2067], cost time 1.5453s, every example cost time is 1.5453, generate speed: 12.9425 tokens/s, avg speed: 10.5042 tokens/s, remaining time: 0:40:20 +pred is: + ['1'] + label is: + ['Japan'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:03,629 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:03,629 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:03,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:03,630 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:03,630 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:04,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:04,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:05,163 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532893180847168 s; generated tokens: 20 tokens; generate speed: 13.047223544269935 tokens/s +2024-07-30 13:53:05,168 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:05,168 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[312/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9526 tokens/s, avg speed: 10.5130 tokens/s, remaining time: 0:40:20 +pred is: + ['40 to 50 students'] + label is: + ['40 to 50 students'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:05,251 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:05,251 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:05,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:05,252 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:05,252 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:06,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,791 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539215326309204 s; generated tokens: 20 tokens; generate speed: 12.993633611976078 tokens/s +2024-07-30 13:53:06,796 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:06,796 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[313/2067], cost time 1.5504s, every example cost time is 1.5504, generate speed: 12.9002 tokens/s, avg speed: 10.5215 tokens/s, remaining time: 0:40:19 +pred is: + ['1'] + label is: + ['popularly based authority'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:06,878 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:06,879 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:06,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:06,879 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:06,880 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:07,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:07,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:07,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:07,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:07,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:07,950 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0703108310699463 s; generated tokens: 5 tokens; generate speed: 4.671540131011945 tokens/s +2024-07-30 13:53:07,955 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:07,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[314/2067], cost time 1.0814s, every example cost time is 1.0814, generate speed: 4.6235 tokens/s, avg speed: 10.5068 tokens/s, remaining time: 0:40:16 +pred is: + ['Enthusiasm'] + label is: + ['enthusiasm'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:08,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:08,038 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:08,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:08,038 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:08,039 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:08,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:09,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:09,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:09,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:09,077 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0380315780639648 s; generated tokens: 4 tokens; generate speed: 3.853447317528056 tokens/s +2024-07-30 13:53:09,081 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:09,082 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[315/2067], cost time 1.0491s, every example cost time is 1.0491, generate speed: 3.8128 tokens/s, avg speed: 10.4906 tokens/s, remaining time: 0:40:13 +pred is: + ['Teacher enthusiasm'] + label is: + ['teacher enthusiasm'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:09,164 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:09,164 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:09,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:09,165 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:09,165 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:10,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,704 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5386691093444824 s; generated tokens: 20 tokens; generate speed: 12.998246262655249 tokens/s +2024-07-30 13:53:10,709 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:10,709 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[316/2067], cost time 1.5499s, every example cost time is 1.5499, generate speed: 12.9042 tokens/s, avg speed: 10.4992 tokens/s, remaining time: 0:40:12 +pred is: + ['self-determined'] + label is: + ['self-determined'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:10,792 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:10,792 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:10,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:10,793 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:10,793 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:11,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:11,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:12,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:12,323 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5293238162994385 s; generated tokens: 20 tokens; generate speed: 13.077675105063584 tokens/s +2024-07-30 13:53:12,328 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:12,328 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[317/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9829 tokens/s, avg speed: 10.5080 tokens/s, remaining time: 0:40:12 +pred is: + ['1'] + label is: + ['student-teacher relationships'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:12,414 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:12,415 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 122, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:12,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:12,415 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:12,415 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:13,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:13,944 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5286900997161865 s; generated tokens: 20 tokens; generate speed: 13.083096439044878 tokens/s +2024-07-30 13:53:13,949 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:13,949 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[318/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9851 tokens/s, avg speed: 10.5167 tokens/s, remaining time: 0:40:11 +pred is: + ['1'] + label is: + ['friendly and supportive'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:14,033 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:14,033 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:14,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:14,034 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:14,034 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:14,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,198 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1631031036376953 s; generated tokens: 8 tokens; generate speed: 6.878152052882825 tokens/s +2024-07-30 13:53:15,202 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:15,203 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[319/2067], cost time 1.1744s, every example cost time is 1.1744, generate speed: 6.8118 tokens/s, avg speed: 10.5068 tokens/s, remaining time: 0:40:09 +pred is: + ['Enthusiasm about the students'] + label is: + ['enthusiasm about the students'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:15,286 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:15,286 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:15,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:15,287 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:15,287 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:16,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,815 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528296709060669 s; generated tokens: 20 tokens; generate speed: 13.086464088699453 tokens/s +2024-07-30 13:53:16,820 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:16,820 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[320/2067], cost time 1.5394s, every example cost time is 1.5394, generate speed: 12.9917 tokens/s, avg speed: 10.5154 tokens/s, remaining time: 0:40:08 +pred is: + ['1'] + label is: + ['sexual misconduct'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.36609572010965, Em score: 51.5625, current_count: 320 +2024-07-30 13:53:16,977 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:16,977 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:16,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:16,978 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:16,978 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:17,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:17,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:17,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,451 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4730682373046875 s; generated tokens: 18 tokens; generate speed: 12.219393198603672 tokens/s +2024-07-30 13:53:18,456 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:18,456 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[321/2067], cost time 1.4845s, every example cost time is 1.4845, generate speed: 12.1250 tokens/s, avg speed: 10.5208 tokens/s, remaining time: 0:40:08 +pred is: + ['England'] + label is: + ['England'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:18,538 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:18,538 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 85, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:18,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:18,539 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:18,539 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:19,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:19,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:20,077 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5375001430511475 s; generated tokens: 20 tokens; generate speed: 13.008128871006335 tokens/s +2024-07-30 13:53:20,082 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:20,082 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[322/2067], cost time 1.5489s, every example cost time is 1.5489, generate speed: 12.9127 tokens/s, avg speed: 10.5292 tokens/s, remaining time: 0:40:07 +pred is: + ['1'] + label is: + ['United States'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:20,164 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:20,165 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:20,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:20,165 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:20,166 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:21,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,516 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3503799438476562 s; generated tokens: 14 tokens; generate speed: 10.367452555693035 tokens/s +2024-07-30 13:53:21,521 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:21,522 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[323/2067], cost time 1.3619s, every example cost time is 1.3619, generate speed: 10.2796 tokens/s, avg speed: 10.5284 tokens/s, remaining time: 0:40:06 +pred is: + ['They fear being labelled a pedophile or hebephile.'] + label is: + ['Fears of being labelled a pedophile or hebephile'] +The F1/Em of this example is: {'F1': 77.41935483870968, 'Em': 0.0} +2024-07-30 13:53:21,604 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:21,605 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:21,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:21,605 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:21,605 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:22,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,675 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0697791576385498 s; generated tokens: 5 tokens; generate speed: 4.673861856719187 tokens/s +2024-07-30 13:53:22,680 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:22,680 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[324/2067], cost time 1.0809s, every example cost time is 1.0809, generate speed: 4.6256 tokens/s, avg speed: 10.5141 tokens/s, remaining time: 0:40:03 +pred is: + ['Occupational stress'] + label is: + ['occupational stress'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:22,763 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:22,763 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 103, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:22,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:22,763 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:22,764 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:23,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:23,986 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.222482442855835 s; generated tokens: 10 tokens; generate speed: 8.180076579782243 tokens/s +2024-07-30 13:53:23,991 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:23,991 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[325/2067], cost time 1.2336s, every example cost time is 1.2336, generate speed: 8.1062 tokens/s, avg speed: 10.5075 tokens/s, remaining time: 0:40:01 +pred is: + ['42'] + label is: + ['42%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:24,072 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:24,072 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 123, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:24,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:24,073 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:24,073 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:25,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:25,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:25,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:25,086 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.012981653213501 s; generated tokens: 3 tokens; generate speed: 2.9615541312945233 tokens/s +2024-07-30 13:53:25,091 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:25,091 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[326/2067], cost time 1.0241s, every example cost time is 1.0241, generate speed: 2.9293 tokens/s, avg speed: 10.4902 tokens/s, remaining time: 0:39:57 +pred is: + ['2'] + label is: + ['several'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:25,173 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:25,174 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:25,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:25,175 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:25,175 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:26,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,707 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5315132141113281 s; generated tokens: 20 tokens; generate speed: 13.058979717393525 tokens/s +2024-07-30 13:53:26,711 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:26,712 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[327/2067], cost time 1.5435s, every example cost time is 1.5435, generate speed: 12.9574 tokens/s, avg speed: 10.4987 tokens/s, remaining time: 0:39:57 +pred is: + ['In a university or college'] + label is: + ['a university or college'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 13:53:26,794 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:26,794 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 104, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:26,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:26,795 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:26,795 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:27,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:27,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:28,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:28,324 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291564464569092 s; generated tokens: 20 tokens; generate speed: 13.079106487985884 tokens/s +2024-07-30 13:53:28,329 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:28,330 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[328/2067], cost time 1.5404s, every example cost time is 1.5404, generate speed: 12.9838 tokens/s, avg speed: 10.5071 tokens/s, remaining time: 0:39:56 +pred is: + ['The individual states and territories'] + label is: + ['the individual states and territories'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:28,413 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:28,413 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 137, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:28,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:28,414 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:28,414 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:29,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:29,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5321669578552246 s; generated tokens: 20 tokens; generate speed: 13.053407722613095 tokens/s +2024-07-30 13:53:29,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:29,952 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[329/2067], cost time 1.5435s, every example cost time is 1.5435, generate speed: 12.9572 tokens/s, avg speed: 10.5155 tokens/s, remaining time: 0:39:56 +pred is: + ["Bachelor's Degree"] + label is: + ["a post-secondary degree Bachelor's Degree"] +The F1/Em of this example is: {'F1': 62.5, 'Em': 0.0} +2024-07-30 13:53:30,034 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:30,034 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:30,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:30,035 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:30,035 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:30,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,570 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5349972248077393 s; generated tokens: 20 tokens; generate speed: 13.029339517213154 tokens/s +2024-07-30 13:53:31,575 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:31,576 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[330/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9329 tokens/s, avg speed: 10.5237 tokens/s, remaining time: 0:39:55 +pred is: + ['Civil servants'] + label is: + ['civil servants'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.377484803859986, Em score: 51.21212121212121, current_count: 330 +2024-07-30 13:53:31,735 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:31,735 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:31,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:31,736 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:31,736 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:32,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:32,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:33,206 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4691452980041504 s; generated tokens: 18 tokens; generate speed: 12.252021651264306 tokens/s +2024-07-30 13:53:33,211 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:33,211 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[331/2067], cost time 1.4807s, every example cost time is 1.4807, generate speed: 12.1563 tokens/s, avg speed: 10.5290 tokens/s, remaining time: 0:39:54 +pred is: + ['Extra pay'] + label is: + ['Extra pay'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:33,293 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:33,294 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 102, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:33,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:33,294 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:33,295 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:34,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,821 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5265147686004639 s; generated tokens: 20 tokens; generate speed: 13.10174025917637 tokens/s +2024-07-30 13:53:34,826 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:34,827 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[332/2067], cost time 1.5379s, every example cost time is 1.5379, generate speed: 13.0051 tokens/s, avg speed: 10.5373 tokens/s, remaining time: 0:39:54 +pred is: + ['Teaching Council'] + label is: + ['the Teaching Council'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:53:34,909 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:34,909 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 111, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:34,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:34,910 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:34,910 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:35,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:35,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:35,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:35,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:35,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,437 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.526906967163086 s; generated tokens: 20 tokens; generate speed: 13.098374969864054 tokens/s +2024-07-30 13:53:36,442 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:36,442 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[333/2067], cost time 1.5382s, every example cost time is 1.5382, generate speed: 13.0021 tokens/s, avg speed: 10.5455 tokens/s, remaining time: 0:39:53 +pred is: + ['2006'] + label is: + ['2006'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:36,525 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:36,525 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 132, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:36,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:36,526 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:36,526 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:37,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,808 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2823567390441895 s; generated tokens: 12 tokens; generate speed: 9.357770450790671 tokens/s +2024-07-30 13:53:37,813 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:37,813 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[334/2067], cost time 1.2935s, every example cost time is 1.2935, generate speed: 9.2772 tokens/s, avg speed: 10.5420 tokens/s, remaining time: 0:39:52 +pred is: + ['41,004'] + label is: + ['41,004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:37,895 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:37,896 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 100, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:37,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:37,896 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:37,897 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:38,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:38,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:38,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:38,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:38,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,190 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2928524017333984 s; generated tokens: 12 tokens; generate speed: 9.281801993724063 tokens/s +2024-07-30 13:53:39,194 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:39,195 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[335/2067], cost time 1.3040s, every example cost time is 1.3040, generate speed: 9.2028 tokens/s, avg speed: 10.5382 tokens/s, remaining time: 0:39:50 +pred is: + ['alternative licensing programs'] + label is: + ['alternative licensing programs'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:39,278 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:39,279 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:39,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:39,279 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:39,279 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:40,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,565 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2856199741363525 s; generated tokens: 12 tokens; generate speed: 9.334018015752518 tokens/s +2024-07-30 13:53:40,570 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:40,570 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[336/2067], cost time 1.2968s, every example cost time is 1.2968, generate speed: 9.2538 tokens/s, avg speed: 10.5346 tokens/s, remaining time: 0:39:48 +pred is: + ['The General Teaching Council for Scotland (GTCS)'] + label is: + ['the General Teaching Council for Scotland (GTCS)'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:40,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:40,654 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:40,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:40,654 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:40,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:41,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:41,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:42,003 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3485107421875 s; generated tokens: 14 tokens; generate speed: 10.381823119398932 tokens/s +2024-07-30 13:53:42,008 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:42,009 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[337/2067], cost time 1.3597s, every example cost time is 1.3597, generate speed: 10.2965 tokens/s, avg speed: 10.5339 tokens/s, remaining time: 0:39:46 +pred is: + ['April'] + label is: + ['April 2008'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:53:42,090 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:42,090 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:42,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:42,091 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:42,091 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:43,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:43,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:43,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:43,121 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0295612812042236 s; generated tokens: 3 tokens; generate speed: 2.9138624914983766 tokens/s +2024-07-30 13:53:43,126 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:43,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[338/2067], cost time 1.0407s, every example cost time is 1.0407, generate speed: 2.8826 tokens/s, avg speed: 10.5168 tokens/s, remaining time: 0:39:43 +pred is: + ['Education'] + label is: + ['Wales'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:43,208 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:43,208 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 120, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:43,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:43,209 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:43,209 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:44,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,736 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5264544486999512 s; generated tokens: 20 tokens; generate speed: 13.102257992063619 tokens/s +2024-07-30 13:53:44,740 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:44,741 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[339/2067], cost time 1.5376s, every example cost time is 1.5376, generate speed: 13.0070 tokens/s, avg speed: 10.5250 tokens/s, remaining time: 0:39:43 +pred is: + ['1'] + label is: + ['trade unions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:53:44,822 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:44,822 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:44,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:44,823 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:44,823 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:45,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:45,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:46,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:46,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:46,353 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5296778678894043 s; generated tokens: 20 tokens; generate speed: 13.074648211780234 tokens/s +2024-07-30 13:53:46,358 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:46,358 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[340/2067], cost time 1.5408s, every example cost time is 1.5408, generate speed: 12.9802 tokens/s, avg speed: 10.5331 tokens/s, remaining time: 0:39:42 +pred is: + ['1'] + label is: + ['each state'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.38108819198175, Em score: 51.1764705882353, current_count: 340 +2024-07-30 13:53:46,551 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:46,552 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 466, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:46,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:46,552 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:46,553 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:47,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:47,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:48,092 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539262056350708 s; generated tokens: 20 tokens; generate speed: 12.993239141758696 tokens/s +2024-07-30 13:53:48,097 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:48,097 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[341/2067], cost time 1.5510s, every example cost time is 1.5510, generate speed: 12.8952 tokens/s, avg speed: 10.5409 tokens/s, remaining time: 0:39:42 +pred is: + ['relatively low salaries'] + label is: + ['relatively low salaries'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:48,180 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:48,180 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 470, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:48,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:48,181 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:48,181 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:49,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,749 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5681626796722412 s; generated tokens: 20 tokens; generate speed: 12.753778838927708 tokens/s +2024-07-30 13:53:49,754 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:49,754 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[342/2067], cost time 1.5796s, every example cost time is 1.5796, generate speed: 12.6617 tokens/s, avg speed: 10.5480 tokens/s, remaining time: 0:39:41 +pred is: + ['There are many forms of spiritual or religious teachers in Christianity, across all three major traditions - ('] + label is: + ['many'] +The F1/Em of this example is: {'F1': 5.555555555555556, 'Em': 0.0} +2024-07-30 13:53:49,838 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:49,838 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 308, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:49,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:49,839 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:49,839 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:50,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:50,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:50,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:50,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:50,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:50,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:51,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:51,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:51,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:51,071 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2311384677886963 s; generated tokens: 9 tokens; generate speed: 7.310306870814709 tokens/s +2024-07-30 13:53:51,075 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:51,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[343/2067], cost time 1.2424s, every example cost time is 1.2424, generate speed: 7.2442 tokens/s, avg speed: 10.5393 tokens/s, remaining time: 0:39:39 +pred is: + ['LDS'] + label is: + ['LDS Church'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:53:51,158 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:51,158 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 105, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:51,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:51,159 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:51,159 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:52,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,713 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5543277263641357 s; generated tokens: 20 tokens; generate speed: 12.867299257913743 tokens/s +2024-07-30 13:53:52,718 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:52,719 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[344/2067], cost time 1.5655s, every example cost time is 1.5655, generate speed: 12.7751 tokens/s, avg speed: 10.5467 tokens/s, remaining time: 0:39:39 +pred is: + ['Guru'] + label is: + ['guru'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:52,801 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:52,801 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 104, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:52,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:52,802 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:52,802 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:53,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:53,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:53,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:53,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:53,840 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0378825664520264 s; generated tokens: 4 tokens; generate speed: 3.8540005673993467 tokens/s +2024-07-30 13:53:53,845 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:53,845 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[345/2067], cost time 1.0489s, every example cost time is 1.0489, generate speed: 3.8136 tokens/s, avg speed: 10.5318 tokens/s, remaining time: 0:39:36 +pred is: + ['Lama'] + label is: + ['a Lama'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:53:53,927 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:53,927 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:53,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:53,928 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:53,928 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:54,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:54,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:54,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:54,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:54,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,477 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5487565994262695 s; generated tokens: 20 tokens; generate speed: 12.913585005809768 tokens/s +2024-07-30 13:53:55,481 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:55,482 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[346/2067], cost time 1.5600s, every example cost time is 1.5600, generate speed: 12.8208 tokens/s, avg speed: 10.5393 tokens/s, remaining time: 0:39:35 +pred is: + ['Ulemas'] + label is: + ['ulemas'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:55,565 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:55,565 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:55,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:55,566 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:55,566 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:56,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:56,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:57,094 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527655839920044 s; generated tokens: 20 tokens; generate speed: 13.09195401043129 tokens/s +2024-07-30 13:53:57,098 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:57,099 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[347/2067], cost time 1.5387s, every example cost time is 1.5387, generate speed: 12.9978 tokens/s, avg speed: 10.5472 tokens/s, remaining time: 0:39:35 +pred is: + ['German'] + label is: + ['German'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:57,181 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:57,181 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:57,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:57,182 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:57,182 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:58,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,620 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.43752121925354 s; generated tokens: 17 tokens; generate speed: 11.825912391628952 tokens/s +2024-07-30 13:53:58,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:58,625 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[348/2067], cost time 1.4487s, every example cost time is 1.4487, generate speed: 11.7345 tokens/s, avg speed: 10.5508 tokens/s, remaining time: 0:39:34 +pred is: + ['Through faith in Jesus Christ as redeemer from sin'] + label is: + ["gift of God's grace"] +The F1/Em of this example is: {'F1': 7.692307692307692, 'Em': 0.0} +2024-07-30 13:53:58,708 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:58,708 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:58,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:58,709 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:58,709 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:53:59,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:59,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:59,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:59,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:59,749 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0402741432189941 s; generated tokens: 4 tokens; generate speed: 3.845140270066231 tokens/s +2024-07-30 13:53:59,754 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:53:59,754 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[349/2067], cost time 1.0515s, every example cost time is 1.0515, generate speed: 3.8039 tokens/s, avg speed: 10.5360 tokens/s, remaining time: 0:39:31 +pred is: + ['Bible'] + label is: + ['Bible'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:53:59,836 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:53:59,837 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:53:59,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:53:59,837 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:53:59,838 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:00,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:00,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:01,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:01,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:01,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:01,277 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4397215843200684 s; generated tokens: 17 tokens; generate speed: 11.807838532912266 tokens/s +2024-07-30 13:54:01,282 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:01,283 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[350/2067], cost time 1.4508s, every example cost time is 1.4508, generate speed: 11.7176 tokens/s, avg speed: 10.5396 tokens/s, remaining time: 0:39:30 +pred is: + ['1483'] + label is: + ['10 November 1483'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +F1 score: 62.4461462338714, Em score: 51.142857142857146, current_count: 350 +2024-07-30 13:54:01,447 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:01,447 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 118, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:01,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:01,448 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:01,448 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:02,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,546 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0976462364196777 s; generated tokens: 6 tokens; generate speed: 5.466242037663162 tokens/s +2024-07-30 13:54:02,551 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:02,551 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[351/2067], cost time 1.1087s, every example cost time is 1.1087, generate speed: 5.4116 tokens/s, avg speed: 10.5279 tokens/s, remaining time: 0:39:27 +pred is: + ['University of Erfurt'] + label is: + ['University of Erfurt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:02,633 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:02,633 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:02,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:02,634 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:02,634 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:03,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:03,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:04,164 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529771327972412 s; generated tokens: 20 tokens; generate speed: 13.073849427226733 tokens/s +2024-07-30 13:54:04,169 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:04,169 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[352/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9791 tokens/s, avg speed: 10.5356 tokens/s, remaining time: 0:39:26 +pred is: + ['Law'] + label is: + ['law'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:04,251 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:04,251 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:04,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:04,252 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:04,252 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:05,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,796 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5439465045928955 s; generated tokens: 20 tokens; generate speed: 12.953816690218524 tokens/s +2024-07-30 13:54:05,801 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:05,801 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[353/2067], cost time 1.5551s, every example cost time is 1.5551, generate speed: 12.8610 tokens/s, avg speed: 10.5431 tokens/s, remaining time: 0:39:26 +pred is: + ['Divine judgment'] + label is: + ['death and divine judgment,'] +The F1/Em of this example is: {'F1': 54.54545454545454, 'Em': 0.0} +2024-07-30 13:54:05,883 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:05,883 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:05,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:05,884 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:05,884 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:06,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:06,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:06,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:06,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:06,924 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0396440029144287 s; generated tokens: 4 tokens; generate speed: 3.847470854241279 tokens/s +2024-07-30 13:54:06,929 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:06,929 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[354/2067], cost time 1.0508s, every example cost time is 1.0508, generate speed: 3.8068 tokens/s, avg speed: 10.5286 tokens/s, remaining time: 0:39:23 +pred is: + ['Prayer'] + label is: + ['Augustinian order'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:54:07,011 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:07,011 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:07,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:07,012 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:07,012 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:07,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:07,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:08,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:08,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:08,049 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.036914587020874 s; generated tokens: 4 tokens; generate speed: 3.8575983500167275 tokens/s +2024-07-30 13:54:08,054 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:08,054 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[355/2067], cost time 1.0480s, every example cost time is 1.0480, generate speed: 3.8167 tokens/s, avg speed: 10.5142 tokens/s, remaining time: 0:39:20 +pred is: + ['1507'] + label is: + ['1507'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:08,136 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:08,136 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 121, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:08,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:08,137 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:08,137 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:09,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,268 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1305797100067139 s; generated tokens: 7 tokens; generate speed: 6.191513909230187 tokens/s +2024-07-30 13:54:09,273 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:09,273 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[356/2067], cost time 1.1417s, every example cost time is 1.1417, generate speed: 6.1314 tokens/s, avg speed: 10.5040 tokens/s, remaining time: 0:39:17 +pred is: + ['19 October 1512'] + label is: + ['19 October 1512'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:09,355 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:09,355 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:09,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:09,356 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:09,356 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:10,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:10,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:10,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:10,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:10,397 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0400826930999756 s; generated tokens: 4 tokens; generate speed: 3.8458480527908456 tokens/s +2024-07-30 13:54:10,401 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:10,402 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[357/2067], cost time 1.0513s, every example cost time is 1.0513, generate speed: 3.8049 tokens/s, avg speed: 10.4897 tokens/s, remaining time: 0:39:14 +pred is: + ['1516'] + label is: + ['1516'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:10,483 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:10,483 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:10,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:10,484 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:10,484 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:11,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:11,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:12,014 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5294044017791748 s; generated tokens: 20 tokens; generate speed: 13.07698603242789 tokens/s +2024-07-30 13:54:12,019 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:12,019 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[358/2067], cost time 1.5406s, every example cost time is 1.5406, generate speed: 12.9821 tokens/s, avg speed: 10.4974 tokens/s, remaining time: 0:39:14 +pred is: + ['31 October 1517'] + label is: + ['31 October 1517'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:12,102 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:12,102 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 92, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:12,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:12,103 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:12,103 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:13,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,626 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5229485034942627 s; generated tokens: 20 tokens; generate speed: 13.132420402995816 tokens/s +2024-07-30 13:54:13,631 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:13,631 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[359/2067], cost time 1.5341s, every example cost time is 1.5341, generate speed: 13.0373 tokens/s, avg speed: 10.5053 tokens/s, remaining time: 0:39:13 +pred is: + ['Johann Tetzel'] + label is: + ['Johann Tetzel'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:13,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:13,714 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 104, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:13,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:13,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:13,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:14,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:14,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:15,243 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5280718803405762 s; generated tokens: 20 tokens; generate speed: 13.088389530172106 tokens/s +2024-07-30 13:54:15,247 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:15,248 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[360/2067], cost time 1.5392s, every example cost time is 1.5392, generate speed: 12.9935 tokens/s, avg speed: 10.5130 tokens/s, remaining time: 0:39:13 +pred is: + ['God'] + label is: + ['God'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.08526843444568, Em score: 51.94444444444444, current_count: 360 +2024-07-30 13:54:15,416 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:15,416 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:15,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:15,417 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:15,417 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:16,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:16,943 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5261781215667725 s; generated tokens: 20 tokens; generate speed: 13.104630263909186 tokens/s +2024-07-30 13:54:16,948 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:16,949 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[361/2067], cost time 1.5385s, every example cost time is 1.5385, generate speed: 12.9999 tokens/s, avg speed: 10.5207 tokens/s, remaining time: 0:39:12 +pred is: + ['1'] + label is: + ['Tetzel'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:54:17,031 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:17,031 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 129, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:17,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:17,032 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:17,032 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:17,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,559 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527104139328003 s; generated tokens: 20 tokens; generate speed: 13.09668377220229 tokens/s +2024-07-30 13:54:18,564 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:18,564 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[362/2067], cost time 1.5385s, every example cost time is 1.5385, generate speed: 12.9999 tokens/s, avg speed: 10.5284 tokens/s, remaining time: 0:39:11 +pred is: + ['The story of the posting on the door'] + label is: + ['the posting on the door'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:54:18,647 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:18,647 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 120, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:18,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:18,648 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:18,648 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:19,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,750 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1016886234283447 s; generated tokens: 6 tokens; generate speed: 5.446184949544636 tokens/s +2024-07-30 13:54:19,755 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:19,755 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[363/2067], cost time 1.1129s, every example cost time is 1.1129, generate speed: 5.3912 tokens/s, avg speed: 10.5169 tokens/s, remaining time: 0:39:09 +pred is: + ['January 1518'] + label is: + ['January 1518'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:19,837 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:19,837 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:19,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:19,838 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:19,838 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:20,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:20,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:21,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:21,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:21,091 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2525584697723389 s; generated tokens: 11 tokens; generate speed: 8.782025163263896 tokens/s +2024-07-30 13:54:21,096 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:21,096 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[364/2067], cost time 1.2637s, every example cost time is 1.2637, generate speed: 8.7045 tokens/s, avg speed: 10.5124 tokens/s, remaining time: 0:39:07 +pred is: + ['1519'] + label is: + ['1519'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:21,178 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:21,178 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:21,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:21,179 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:21,179 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:22,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,709 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291495323181152 s; generated tokens: 20 tokens; generate speed: 13.079165625928674 tokens/s +2024-07-30 13:54:22,713 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:22,714 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[365/2067], cost time 1.5403s, every example cost time is 1.5403, generate speed: 12.9842 tokens/s, avg speed: 10.5199 tokens/s, remaining time: 0:39:06 +pred is: + ['He lectured on the Psalms, the books of Hebrews, Romans, and Gal'] + label is: + ['lectured'] +The F1/Em of this example is: {'F1': 7.4074074074074066, 'Em': 0.0} +2024-07-30 13:54:22,796 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:22,796 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 312, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:22,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:22,797 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:22,797 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:23,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:23,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:23,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:23,808 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0101852416992188 s; generated tokens: 3 tokens; generate speed: 2.969752354482769 tokens/s +2024-07-30 13:54:23,812 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:23,813 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[366/2067], cost time 1.0213s, every example cost time is 1.0213, generate speed: 2.9375 tokens/s, avg speed: 10.5046 tokens/s, remaining time: 0:39:03 +pred is: + ['God'] + label is: + ['God'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:23,894 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:23,895 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 89, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:23,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:23,895 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:23,895 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:24,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:24,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:24,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:24,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:24,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:24,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,419 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5232934951782227 s; generated tokens: 20 tokens; generate speed: 13.129446205414299 tokens/s +2024-07-30 13:54:25,424 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:25,424 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[367/2067], cost time 1.5345s, every example cost time is 1.5345, generate speed: 13.0334 tokens/s, avg speed: 10.5123 tokens/s, remaining time: 0:39:02 +pred is: + ['The rediscovery of "Christ and His salvation"'] + label is: + ['Christ and His salvation'] +The F1/Em of this example is: {'F1': 63.63636363636363, 'Em': 0.0} +2024-07-30 13:54:25,506 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:25,507 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:25,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:25,507 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:25,507 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:26,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:26,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:27,034 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5262212753295898 s; generated tokens: 20 tokens; generate speed: 13.104259731722694 tokens/s +2024-07-30 13:54:27,039 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:27,039 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[368/2067], cost time 1.5373s, every example cost time is 1.5373, generate speed: 13.0098 tokens/s, avg speed: 10.5198 tokens/s, remaining time: 0:39:02 +pred is: + ['Archbishop Albrecht of Mainz and Magdeburg'] + label is: + ['Archbishop Albrecht'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 13:54:27,122 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:27,122 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 306, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:27,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:27,123 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:27,123 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:28,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,503 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3798236846923828 s; generated tokens: 15 tokens; generate speed: 10.87095414175623 tokens/s +2024-07-30 13:54:28,508 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:28,508 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[369/2067], cost time 1.3910s, every example cost time is 1.3910, generate speed: 10.7838 tokens/s, avg speed: 10.5205 tokens/s, remaining time: 0:39:00 +pred is: + ['1'] + label is: + ['Pope Leo X'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:54:28,590 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:28,590 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:28,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:28,591 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:28,591 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:29,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:29,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:30,126 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5346498489379883 s; generated tokens: 20 tokens; generate speed: 13.032288775084716 tokens/s +2024-07-30 13:54:30,130 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:30,131 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[370/2067], cost time 1.5457s, every example cost time is 1.5457, generate speed: 12.9394 tokens/s, avg speed: 10.5279 tokens/s, remaining time: 0:39:00 +pred is: + ['January 1519'] + label is: + ['January 1519'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.97188527108475, Em score: 51.62162162162162, current_count: 370 +2024-07-30 13:54:30,301 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:30,301 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:30,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:30,302 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:30,302 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:31,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,833 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310041904449463 s; generated tokens: 20 tokens; generate speed: 13.063321527674933 tokens/s +2024-07-30 13:54:31,838 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:31,838 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[371/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9688 tokens/s, avg speed: 10.5352 tokens/s, remaining time: 0:38:59 +pred is: + ['15 June 1520'] + label is: + ['15 June 1520'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:31,920 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:31,920 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:31,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:31,921 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:31,921 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:32,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:32,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:32,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:32,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:32,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:32,990 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.068467617034912 s; generated tokens: 5 tokens; generate speed: 4.679599007291791 tokens/s +2024-07-30 13:54:32,994 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:32,995 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[372/2067], cost time 1.0793s, every example cost time is 1.0793, generate speed: 4.6327 tokens/s, avg speed: 10.5228 tokens/s, remaining time: 0:38:56 +pred is: + ['The secular authorities'] + label is: + ['secular authorities'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:54:33,076 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:33,077 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 134, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:33,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:33,077 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:33,078 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:34,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,606 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528390645980835 s; generated tokens: 20 tokens; generate speed: 13.085659777226082 tokens/s +2024-07-30 13:54:34,611 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:34,611 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[373/2067], cost time 1.5395s, every example cost time is 1.5395, generate speed: 12.9910 tokens/s, avg speed: 10.5302 tokens/s, remaining time: 0:38:56 +pred is: + ['Johann Eck'] + label is: + ['Johann Eck'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:34,693 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:34,694 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 90, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:34,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:34,694 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:34,694 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:35,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:35,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:36,064 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3696935176849365 s; generated tokens: 15 tokens; generate speed: 10.951355034046655 tokens/s +2024-07-30 13:54:36,069 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:36,069 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[374/2067], cost time 1.3806s, every example cost time is 1.3806, generate speed: 10.8647 tokens/s, avg speed: 10.5311 tokens/s, remaining time: 0:38:54 +pred is: + ['Raised his arm in the traditional salute of a knight winning a bout'] + label is: + ['raised his arm'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:54:36,152 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:36,152 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:36,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:36,153 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:36,153 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:37,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,258 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1049058437347412 s; generated tokens: 6 tokens; generate speed: 5.430326967698111 tokens/s +2024-07-30 13:54:37,263 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:37,263 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[375/2067], cost time 1.1160s, every example cost time is 1.1160, generate speed: 5.3762 tokens/s, avg speed: 10.5200 tokens/s, remaining time: 0:38:52 +pred is: + ['Recant his writings'] + label is: + ['recant his writings'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:37,344 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:37,345 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 140, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:37,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:37,345 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:37,346 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:38,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,412 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0667686462402344 s; generated tokens: 5 tokens; generate speed: 4.687051890418992 tokens/s +2024-07-30 13:54:38,417 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:38,417 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[376/2067], cost time 1.0776s, every example cost time is 1.0776, generate speed: 4.6401 tokens/s, avg speed: 10.5077 tokens/s, remaining time: 0:38:49 +pred is: + ['By the Emperor'] + label is: + ['private conferences'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:54:38,499 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:38,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:38,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:38,500 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:38,500 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:39,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:39,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:40,047 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5459229946136475 s; generated tokens: 20 tokens; generate speed: 12.93725500538165 tokens/s +2024-07-30 13:54:40,051 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:40,052 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[377/2067], cost time 1.5575s, every example cost time is 1.5575, generate speed: 12.8415 tokens/s, avg speed: 10.5147 tokens/s, remaining time: 0:38:49 +pred is: + ['His disappearance during his return trip back to Wittenberg'] + label is: + ["Luther's disappearance"] +The F1/Em of this example is: {'F1': 18.18181818181818, 'Em': 0.0} +2024-07-30 13:54:40,134 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:40,135 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:40,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:40,135 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:40,135 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:41,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,661 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.525259256362915 s; generated tokens: 20 tokens; generate speed: 13.112524914414463 tokens/s +2024-07-30 13:54:41,666 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:41,666 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[378/2067], cost time 1.5364s, every example cost time is 1.5364, generate speed: 13.0175 tokens/s, avg speed: 10.5221 tokens/s, remaining time: 0:38:48 +pred is: + ['sin'] + label is: + ['a sin'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:54:41,748 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:41,748 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:41,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:41,749 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:41,749 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:42,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:42,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:43,276 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5264687538146973 s; generated tokens: 20 tokens; generate speed: 13.102135205859485 tokens/s +2024-07-30 13:54:43,281 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:43,281 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[379/2067], cost time 1.5376s, every example cost time is 1.5376, generate speed: 13.0070 tokens/s, avg speed: 10.5294 tokens/s, remaining time: 0:38:47 +pred is: + ['1521'] + label is: + ['summer of 1521'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:54:43,363 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:43,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:43,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:43,364 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:43,364 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:44,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,584 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2192935943603516 s; generated tokens: 10 tokens; generate speed: 8.201470135046561 tokens/s +2024-07-30 13:54:44,588 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:44,589 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[380/2067], cost time 1.2302s, every example cost time is 1.2302, generate speed: 8.1286 tokens/s, avg speed: 10.5238 tokens/s, remaining time: 0:38:45 +pred is: + ['He placed it on prophetic faith.'] + label is: + ['prophetic faith'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +F1 score: 62.82748956618381, Em score: 51.05263157894737, current_count: 380 +2024-07-30 13:54:44,770 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:44,771 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:44,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:44,771 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:44,772 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:45,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:45,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:46,306 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5339829921722412 s; generated tokens: 20 tokens; generate speed: 13.037954202920085 tokens/s +2024-07-30 13:54:46,311 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:46,311 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[381/2067], cost time 1.5455s, every example cost time is 1.5455, generate speed: 12.9404 tokens/s, avg speed: 10.5309 tokens/s, remaining time: 0:38:45 +pred is: + ['Gabriel Zwilling'] + label is: + ['Gabriel Zwilling'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:46,394 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:46,394 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:46,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:46,394 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:46,395 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:47,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:47,924 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5289115905761719 s; generated tokens: 20 tokens; generate speed: 13.081201112788333 tokens/s +2024-07-30 13:54:47,929 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:47,929 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[382/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9864 tokens/s, avg speed: 10.5381 tokens/s, remaining time: 0:38:44 +pred is: + ['6 March 1522'] + label is: + ['6 March 1522'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:48,011 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:48,011 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 113, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:48,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:48,012 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:48,012 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:48,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:48,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,453 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4415085315704346 s; generated tokens: 17 tokens; generate speed: 11.79320109987802 tokens/s +2024-07-30 13:54:49,458 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:49,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[383/2067], cost time 1.4529s, every example cost time is 1.4529, generate speed: 11.7010 tokens/s, avg speed: 10.5413 tokens/s, remaining time: 0:38:43 +pred is: + ['immediate'] + label is: + ['immediate'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:49,542 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:49,542 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 123, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:49,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:49,543 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:49,543 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:50,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:50,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:50,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:50,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:50,581 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0375511646270752 s; generated tokens: 4 tokens; generate speed: 3.8552315648334425 tokens/s +2024-07-30 13:54:50,586 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:50,586 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[384/2067], cost time 1.0488s, every example cost time is 1.0488, generate speed: 3.8140 tokens/s, avg speed: 10.5279 tokens/s, remaining time: 0:38:40 +pred is: + ['public order'] + label is: + ['public order'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:50,668 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:50,668 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:50,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:50,669 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:50,669 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:51,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:51,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:52,075 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.405940055847168 s; generated tokens: 16 tokens; generate speed: 11.380286046661489 tokens/s +2024-07-30 13:54:52,080 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:52,080 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[385/2067], cost time 1.4171s, every example cost time is 1.4171, generate speed: 11.2905 tokens/s, avg speed: 10.5300 tokens/s, remaining time: 0:38:39 +pred is: + ['A preacher'] + label is: + ['Zwickau prophet'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 13:54:52,162 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:52,163 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:52,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:52,163 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:52,164 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:53,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,234 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0700874328613281 s; generated tokens: 5 tokens; generate speed: 4.672515391224061 tokens/s +2024-07-30 13:54:53,239 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:53,239 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[386/2067], cost time 1.0812s, every example cost time is 1.0812, generate speed: 4.6244 tokens/s, avg speed: 10.5180 tokens/s, remaining time: 0:38:36 +pred is: + ['the temporal authorities'] + label is: + ['temporal authorities'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:54:53,321 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:53,321 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:53,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:53,322 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:53,322 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:54,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,849 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5267484188079834 s; generated tokens: 20 tokens; generate speed: 13.099735197770896 tokens/s +2024-07-30 13:54:54,854 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:54,854 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[387/2067], cost time 1.5379s, every example cost time is 1.5379, generate speed: 13.0050 tokens/s, avg speed: 10.5251 tokens/s, remaining time: 0:38:35 +pred is: + ['3'] + label is: + ['on three grounds'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:54:54,936 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:54,936 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:54,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:54,937 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:54,937 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:55,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:55,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:55,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:55,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,442 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5048422813415527 s; generated tokens: 19 tokens; generate speed: 12.625907867940604 tokens/s +2024-07-30 13:54:56,447 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:56,447 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[388/2067], cost time 1.5161s, every example cost time is 1.5161, generate speed: 12.5319 tokens/s, avg speed: 10.5308 tokens/s, remaining time: 0:38:35 +pred is: + ['He denied them his support'] + label is: + ['backing for the uprising'] +The F1/Em of this example is: {'F1': 12.5, 'Em': 0.0} +2024-07-30 13:54:56,531 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:56,531 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:56,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:56,531 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:56,532 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:57,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.189993143081665 s; generated tokens: 9 tokens; generate speed: 7.563068789365588 tokens/s +2024-07-30 13:54:57,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:57,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[389/2067], cost time 1.2013s, every example cost time is 1.2013, generate speed: 7.4918 tokens/s, avg speed: 10.5240 tokens/s, remaining time: 0:38:32 +pred is: + ['Katharina von Bora'] + label is: + ['Katharina von Bora'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:54:57,808 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:57,808 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 132, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:57,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:57,809 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:57,809 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:54:58,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:58,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:59,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:59,332 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5232229232788086 s; generated tokens: 20 tokens; generate speed: 13.130054501116005 tokens/s +2024-07-30 13:54:59,337 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:54:59,337 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[390/2067], cost time 1.5344s, every example cost time is 1.5344, generate speed: 13.0348 tokens/s, avg speed: 10.5312 tokens/s, remaining time: 0:38:32 +pred is: + ['13 June 1525'] + label is: + ['13 June 1525'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.06481889354661, Em score: 51.282051282051285, current_count: 390 +2024-07-30 13:54:59,515 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:54:59,516 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:54:59,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:54:59,516 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:54:59,516 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:00,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:00,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:01,048 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5317347049713135 s; generated tokens: 20 tokens; generate speed: 13.05709137169061 tokens/s +2024-07-30 13:55:01,053 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:01,054 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[391/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9554 tokens/s, avg speed: 10.5381 tokens/s, remaining time: 0:38:31 +pred is: + ['The seal of approval'] + label is: + ['seal of approval'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:55:01,135 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:01,135 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:01,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:01,136 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:01,136 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:02,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5301079750061035 s; generated tokens: 20 tokens; generate speed: 13.070972981446111 tokens/s +2024-07-30 13:55:02,671 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:02,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[392/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9768 tokens/s, avg speed: 10.5451 tokens/s, remaining time: 0:38:30 +pred is: + ['1525-1534'] + label is: + ['The Black Cloister'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:55:02,753 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:02,754 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:02,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:02,754 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:02,754 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:03,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:03,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:04,287 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532404899597168 s; generated tokens: 20 tokens; generate speed: 13.051380875418445 tokens/s +2024-07-30 13:55:04,292 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:04,292 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[393/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9567 tokens/s, avg speed: 10.5519 tokens/s, remaining time: 0:38:30 +pred is: + ["Congregations' choosing their own ministers"] + label is: + ['choosing their own ministers'] +The F1/Em of this example is: {'F1': 82.35294117647058, 'Em': 0.0} +2024-07-30 13:55:04,375 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:04,375 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 315, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:04,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:04,376 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:04,376 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:05,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,910 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338504314422607 s; generated tokens: 20 tokens; generate speed: 13.039080988616501 tokens/s +2024-07-30 13:55:05,915 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:05,915 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[394/2067], cost time 1.5450s, every example cost time is 1.5450, generate speed: 12.9450 tokens/s, avg speed: 10.5587 tokens/s, remaining time: 0:38:29 +pred is: + ['Confusing or upsetting the people'] + label is: + ['extreme change'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 13:55:05,997 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:05,998 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 295, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:05,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:05,998 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:05,999 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:06,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:06,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,535 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5359725952148438 s; generated tokens: 20 tokens; generate speed: 13.021065650720484 tokens/s +2024-07-30 13:55:07,539 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:07,540 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[395/2067], cost time 1.5472s, every example cost time is 1.5472, generate speed: 12.9265 tokens/s, avg speed: 10.5654 tokens/s, remaining time: 0:38:28 +pred is: + ['1526'] + label is: + ['early 1526'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:55:07,623 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:07,623 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 133, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:07,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:07,624 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:07,624 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:08,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:08,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:09,153 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529176950454712 s; generated tokens: 20 tokens; generate speed: 13.078931116541389 tokens/s +2024-07-30 13:55:09,158 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:09,158 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[396/2067], cost time 1.5404s, every example cost time is 1.5404, generate speed: 12.9838 tokens/s, avg speed: 10.5723 tokens/s, remaining time: 0:38:28 +pred is: + ['1527'] + label is: + ['1527'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:09,241 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:09,241 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:09,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:09,242 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:09,242 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:10,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,771 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5289320945739746 s; generated tokens: 20 tokens; generate speed: 13.081025685168084 tokens/s +2024-07-30 13:55:10,776 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:10,776 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[397/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9849 tokens/s, avg speed: 10.5790 tokens/s, remaining time: 0:38:27 +pred is: + ['Catechism'] + label is: + ['catechism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:10,859 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:10,859 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:10,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:10,860 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:10,860 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:11,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:11,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:12,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:12,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:12,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:12,390 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529876708984375 s; generated tokens: 20 tokens; generate speed: 13.072948873950251 tokens/s +2024-07-30 13:55:12,395 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:12,395 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[398/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9771 tokens/s, avg speed: 10.5857 tokens/s, remaining time: 0:38:26 +pred is: + ['The catechism'] + label is: + ['The catechism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:12,477 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:12,478 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 269, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:12,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:12,478 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:12,478 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:13,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:13,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:14,015 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536158800125122 s; generated tokens: 20 tokens; generate speed: 13.019487307152733 tokens/s +2024-07-30 13:55:14,020 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:14,020 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[399/2067], cost time 1.5474s, every example cost time is 1.5474, generate speed: 12.9251 tokens/s, avg speed: 10.5923 tokens/s, remaining time: 0:38:26 +pred is: + ["Luther's Small Catechism"] + label is: + ['Small Catechism'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 13:55:14,102 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:14,102 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:14,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:14,103 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:14,103 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:15,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,520 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4164230823516846 s; generated tokens: 16 tokens; generate speed: 11.29605991271706 tokens/s +2024-07-30 13:55:15,525 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:15,525 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[400/2067], cost time 1.4277s, every example cost time is 1.4277, generate speed: 11.2071 tokens/s, avg speed: 10.5939 tokens/s, remaining time: 0:38:24 +pred is: + ['1522'] + label is: + ['1522'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.21908077414911, Em score: 51.0, current_count: 400 +2024-07-30 13:55:15,703 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:15,703 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 112, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:15,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:15,704 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:15,704 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:16,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:16,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:17,236 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531893253326416 s; generated tokens: 20 tokens; generate speed: 13.055739984865902 tokens/s +2024-07-30 13:55:17,241 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:17,241 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[401/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9610 tokens/s, avg speed: 10.6005 tokens/s, remaining time: 0:38:24 +pred is: + ['Saxon chancellery'] + label is: + ['Saxon chancellery'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:17,324 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:17,324 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:17,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:17,325 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:17,325 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:18,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,858 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5325126647949219 s; generated tokens: 20 tokens; generate speed: 13.050463111622223 tokens/s +2024-07-30 13:55:18,862 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:18,862 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[402/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9564 tokens/s, avg speed: 10.6070 tokens/s, remaining time: 0:38:23 +pred is: + ['German-language publications'] + label is: + ['German-language publications'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:18,945 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:18,945 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:18,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:18,946 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:18,946 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:19,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:19,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:19,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:19,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:20,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:20,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:20,050 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1035864353179932 s; generated tokens: 6 tokens; generate speed: 5.43681927213171 tokens/s +2024-07-30 13:55:20,055 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:20,055 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[403/2067], cost time 1.1147s, every example cost time is 1.1147, generate speed: 5.3826 tokens/s, avg speed: 10.5966 tokens/s, remaining time: 0:38:20 +pred is: + ['Hymn-writing'] + label is: + ['authoring hymns'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:55:20,138 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:20,138 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:20,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:20,139 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:20,139 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:21,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,677 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378549098968506 s; generated tokens: 20 tokens; generate speed: 13.005128033399114 tokens/s +2024-07-30 13:55:21,682 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:21,682 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[404/2067], cost time 1.5491s, every example cost time is 1.5491, generate speed: 12.9109 tokens/s, avg speed: 10.6030 tokens/s, remaining time: 0:38:20 +pred is: + ['Particular events in his life and the unfolding Reformation'] + label is: + ['events in his life'] +The F1/Em of this example is: {'F1': 58.333333333333336, 'Em': 0.0} +2024-07-30 13:55:21,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:21,765 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:21,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:21,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:21,766 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:22,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:22,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:23,302 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535595417022705 s; generated tokens: 20 tokens; generate speed: 13.024263929347402 tokens/s +2024-07-30 13:55:23,307 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:23,307 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[405/2067], cost time 1.5468s, every example cost time is 1.5468, generate speed: 12.9300 tokens/s, avg speed: 10.6094 tokens/s, remaining time: 0:38:19 +pred is: + ['1524'] + label is: + ['1524'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:23,389 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:23,389 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:23,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:23,390 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:23,390 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:24,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,825 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4346837997436523 s; generated tokens: 16 tokens; generate speed: 11.152283174075613 tokens/s +2024-07-30 13:55:24,830 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:24,830 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[406/2067], cost time 1.4458s, every example cost time is 1.4458, generate speed: 11.0665 tokens/s, avg speed: 10.6106 tokens/s, remaining time: 0:38:18 +pred is: + ['1538'] + label is: + ['1538'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:24,913 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:24,913 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 269, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:24,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:24,913 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:24,914 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:25,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:25,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:25,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:25,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:25,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,449 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5349609851837158 s; generated tokens: 20 tokens; generate speed: 13.02964713308739 tokens/s +2024-07-30 13:55:26,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:26,454 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[407/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9362 tokens/s, avg speed: 10.6170 tokens/s, remaining time: 0:38:17 +pred is: + ['1523'] + label is: + ['1523'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:26,536 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:26,536 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 362, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:26,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:26,537 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:26,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:27,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:27,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:28,078 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5408694744110107 s; generated tokens: 20 tokens; generate speed: 12.979684737829526 tokens/s +2024-07-30 13:55:28,083 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:28,083 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[408/2067], cost time 1.5521s, every example cost time is 1.5521, generate speed: 12.8856 tokens/s, avg speed: 10.6232 tokens/s, remaining time: 0:38:16 +pred is: + ['Nun komm, der Heiden Heiland'] + label is: + ['Nun komm, der Heiden Heiland'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:28,166 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:28,167 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:28,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:28,167 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:28,167 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:29,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,712 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5447487831115723 s; generated tokens: 20 tokens; generate speed: 12.947089014509011 tokens/s +2024-07-30 13:55:29,717 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:29,717 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[409/2067], cost time 1.5559s, every example cost time is 1.5559, generate speed: 12.8540 tokens/s, avg speed: 10.6293 tokens/s, remaining time: 0:38:16 +pred is: + ['Baptismal theology'] + label is: + ['baptism'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:55:29,824 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:29,825 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:29,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:29,825 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:29,826 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:30,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:30,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:31,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:31,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:31,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:31,385 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5595004558563232 s; generated tokens: 20 tokens; generate speed: 12.824619527935937 tokens/s +2024-07-30 13:55:31,390 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:31,390 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[410/2067], cost time 1.5953s, every example cost time is 1.5953, generate speed: 12.5367 tokens/s, avg speed: 10.6347 tokens/s, remaining time: 0:38:15 +pred is: + ['In early Lutheran hymnals'] + label is: + ['early Lutheran hymnals'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +F1 score: 63.48609506421053, Em score: 51.21951219512195, current_count: 410 +2024-07-30 13:55:31,573 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:31,574 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:31,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:31,574 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:31,574 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:32,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:32,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:33,108 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337398052215576 s; generated tokens: 20 tokens; generate speed: 13.040021476857271 tokens/s +2024-07-30 13:55:33,113 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:33,113 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[411/2067], cost time 1.5449s, every example cost time is 1.5449, generate speed: 12.9456 tokens/s, avg speed: 10.6410 tokens/s, remaining time: 0:38:14 +pred is: + ['Johann Sebastian Bach'] + label is: + ['Johann Sebastian Bach'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:33,195 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:33,195 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:33,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:33,196 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:33,196 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:34,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,726 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5294947624206543 s; generated tokens: 20 tokens; generate speed: 13.076213460415522 tokens/s +2024-07-30 13:55:34,731 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:34,731 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[412/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9811 tokens/s, avg speed: 10.6473 tokens/s, remaining time: 0:38:14 +pred is: + ['It sleeps in peace'] + label is: + ['sleeps'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:55:34,813 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:34,814 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 113, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:34,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:34,814 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:34,815 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:35,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:35,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:36,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:36,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:36,359 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5438172817230225 s; generated tokens: 20 tokens; generate speed: 12.954900969678494 tokens/s +2024-07-30 13:55:36,363 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:36,364 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[413/2067], cost time 1.5550s, every example cost time is 1.5550, generate speed: 12.8617 tokens/s, avg speed: 10.6533 tokens/s, remaining time: 0:38:13 +pred is: + ['Franz Pieper'] + label is: + ['Franz Pieper'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:36,446 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:36,447 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:36,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:36,447 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:36,447 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:37,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:37,977 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291047096252441 s; generated tokens: 20 tokens; generate speed: 13.079549015908556 tokens/s +2024-07-30 13:55:37,981 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:37,982 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[414/2067], cost time 1.5403s, every example cost time is 1.5403, generate speed: 12.9849 tokens/s, avg speed: 10.6595 tokens/s, remaining time: 0:38:12 +pred is: + ['In his Commentary on Genesis'] + label is: + ['Commentary on Genesis'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 13:55:38,064 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:38,064 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 135, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:38,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:38,065 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:38,065 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:39,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,597 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5317983627319336 s; generated tokens: 20 tokens; generate speed: 13.056548751188359 tokens/s +2024-07-30 13:55:39,602 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:39,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[415/2067], cost time 1.5429s, every example cost time is 1.5429, generate speed: 12.9622 tokens/s, avg speed: 10.6657 tokens/s, remaining time: 0:38:11 +pred is: + ['October 1529'] + label is: + ['October 1529'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:39,684 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:39,684 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 303, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:39,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:39,685 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:39,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:40,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:40,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:41,218 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5330770015716553 s; generated tokens: 20 tokens; generate speed: 13.045659141384759 tokens/s +2024-07-30 13:55:41,223 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:41,223 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[416/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9526 tokens/s, avg speed: 10.6718 tokens/s, remaining time: 0:38:11 +pred is: + ['The significance of the words spoken by Jesus at the Last Supper'] + label is: + ['words spoken by Jesus'] +The F1/Em of this example is: {'F1': 46.666666666666664, 'Em': 0.0} +2024-07-30 13:55:41,307 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:41,307 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 137, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:41,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:41,308 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:41,308 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:42,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:42,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:42,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:42,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:42,375 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.066960334777832 s; generated tokens: 4 tokens; generate speed: 3.748967857209894 tokens/s +2024-07-30 13:55:42,380 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:42,380 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[417/2067], cost time 1.0780s, every example cost time is 1.0780, generate speed: 3.7104 tokens/s, avg speed: 10.6588 tokens/s, remaining time: 0:38:08 +pred is: + ['1530'] + label is: + ['1530'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:42,462 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:42,463 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 414, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:42,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:42,463 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:42,463 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:43,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:43,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:44,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5383098125457764 s; generated tokens: 20 tokens; generate speed: 13.001282210442149 tokens/s +2024-07-30 13:55:44,007 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:44,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[418/2067], cost time 1.5494s, every example cost time is 1.5494, generate speed: 12.9082 tokens/s, avg speed: 10.6649 tokens/s, remaining time: 0:38:07 +pred is: + ['antithetical'] + label is: + ['antithetical'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:44,089 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:44,089 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:44,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:44,090 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:44,090 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:45,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,625 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535165786743164 s; generated tokens: 20 tokens; generate speed: 13.027908889521152 tokens/s +2024-07-30 13:55:45,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:45,630 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[419/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9347 tokens/s, avg speed: 10.6709 tokens/s, remaining time: 0:38:07 +pred is: + ['He stated that Jesus Christ was born a Jew.'] + label is: + ['Jesus Christ was born a Jew'] +The F1/Em of this example is: {'F1': 75.86206896551725, 'Em': 0.0} +2024-07-30 13:55:45,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:45,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 332, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:45,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:45,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:45,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:46,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:46,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:47,255 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5411739349365234 s; generated tokens: 20 tokens; generate speed: 12.977120587510937 tokens/s +2024-07-30 13:55:47,260 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:47,260 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[420/2067], cost time 1.5524s, every example cost time is 1.5524, generate speed: 12.8833 tokens/s, avg speed: 10.6768 tokens/s, remaining time: 0:38:06 +pred is: + ['As agents of the Biblical apocalypse that would destroy the antichrist, whom Luther believed to be'] + label is: + ['as a scourge'] +The F1/Em of this example is: {'F1': 10.81081081081081, 'Em': 0.0} +F1 score: 63.71206450999496, Em score: 51.19047619047619, current_count: 420 +2024-07-30 13:55:47,447 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:47,447 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:47,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:47,448 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:47,448 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:48,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:48,987 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.538548469543457 s; generated tokens: 20 tokens; generate speed: 12.999265473862337 tokens/s +2024-07-30 13:55:48,992 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:48,992 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[421/2067], cost time 1.5498s, every example cost time is 1.5498, generate speed: 12.9051 tokens/s, avg speed: 10.6827 tokens/s, remaining time: 0:38:05 +pred is: + ['Quran'] + label is: + ["Qur'an"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:55:49,075 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:49,075 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:49,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:49,076 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:49,076 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:50,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,610 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5336828231811523 s; generated tokens: 20 tokens; generate speed: 13.040505962318965 tokens/s +2024-07-30 13:55:50,615 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:50,615 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[422/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9463 tokens/s, avg speed: 10.6887 tokens/s, remaining time: 0:38:04 +pred is: + ["God's wrath to Christians"] + label is: + ["God's wrath to Christians"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:50,697 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:50,697 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:50,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:50,698 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:50,698 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:51,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:51,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:52,234 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354375839233398 s; generated tokens: 20 tokens; generate speed: 13.025602739836636 tokens/s +2024-07-30 13:55:52,238 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:52,239 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[423/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9319 tokens/s, avg speed: 10.6946 tokens/s, remaining time: 0:38:04 +pred is: + ["The law as the Holy Spirit's tool to work sorrow over sin in man's heart, thus"] + label is: + ['second use of the law'] +The F1/Em of this example is: {'F1': 13.333333333333334, 'Em': 0.0} +2024-07-30 13:55:52,321 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:52,321 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:52,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:52,322 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:52,322 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:53,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,852 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5293972492218018 s; generated tokens: 20 tokens; generate speed: 13.07704718978443 tokens/s +2024-07-30 13:55:53,856 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:53,857 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[424/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9828 tokens/s, avg speed: 10.7005 tokens/s, remaining time: 0:38:03 +pred is: + ['Follow them in their vocations on a daily basis'] + label is: + ['ought to live'] +The F1/Em of this example is: {'F1': 9.09090909090909, 'Em': 0.0} +2024-07-30 13:55:53,939 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:53,940 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:53,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:53,940 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:53,941 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:54,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:54,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:54,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:54,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,470 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5294032096862793 s; generated tokens: 20 tokens; generate speed: 13.076996225280922 tokens/s +2024-07-30 13:55:55,475 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:55,475 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[425/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9824 tokens/s, avg speed: 10.7065 tokens/s, remaining time: 0:38:02 +pred is: + ['baptism'] + label is: + ['baptism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:55:55,557 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:55,558 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 328, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:55,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:55,558 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:55,558 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:56,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:56,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:57,094 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353672504425049 s; generated tokens: 20 tokens; generate speed: 13.026199428336017 tokens/s +2024-07-30 13:55:57,099 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:57,099 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[426/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9306 tokens/s, avg speed: 10.7123 tokens/s, remaining time: 0:38:01 +pred is: + ["He wanted to marry one of his wife's ladies-in-waiting."] + label is: + ['wanted to marry'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 13:55:57,189 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:57,189 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 299, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:57,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:57,190 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:57,190 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:58,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,728 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378024578094482 s; generated tokens: 20 tokens; generate speed: 13.005571618404991 tokens/s +2024-07-30 13:55:58,733 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:55:58,733 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[427/2067], cost time 1.5492s, every example cost time is 1.5492, generate speed: 12.9096 tokens/s, avg speed: 10.7180 tokens/s, remaining time: 0:38:00 +pred is: + ['expelled'] + label is: + ['expelled Jews'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:55:58,815 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:55:58,816 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 350, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:55:58,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:58,816 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:55:58,817 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:55:59,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:55:59,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:00,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:00,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:00,362 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5452866554260254 s; generated tokens: 20 tokens; generate speed: 12.942582484468637 tokens/s +2024-07-30 13:56:00,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:00,367 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[428/2067], cost time 1.5564s, every example cost time is 1.5564, generate speed: 12.8499 tokens/s, avg speed: 10.7236 tokens/s, remaining time: 0:38:00 +pred is: + ['Von den Juden und Ihren Lügen'] + label is: + ['Von den Juden und Ihren Lügen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:00,450 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:00,450 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:00,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:00,451 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:00,451 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:01,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:01,983 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318353176116943 s; generated tokens: 20 tokens; generate speed: 13.056233767466777 tokens/s +2024-07-30 13:56:01,988 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:01,988 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[429/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9607 tokens/s, avg speed: 10.7294 tokens/s, remaining time: 0:37:59 +pred is: + ['Jews'] + label is: + ['the Jews'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:56:02,070 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:02,071 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 304, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:02,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:02,071 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:02,071 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:03,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,268 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1964783668518066 s; generated tokens: 9 tokens; generate speed: 7.522074990524857 tokens/s +2024-07-30 13:56:03,273 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:03,273 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[430/2067], cost time 1.2076s, every example cost time is 1.2076, generate speed: 7.4529 tokens/s, avg speed: 10.7228 tokens/s, remaining time: 0:37:57 +pred is: + ['Luther'] + label is: + ['Luther'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.53835194563283, Em score: 50.93023255813954, current_count: 430 +2024-07-30 13:56:03,463 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:03,463 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:03,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:03,464 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:03,464 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:04,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:04,997 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5323495864868164 s; generated tokens: 20 tokens; generate speed: 13.051851990154253 tokens/s +2024-07-30 13:56:05,001 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:05,002 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[431/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9542 tokens/s, avg speed: 10.7285 tokens/s, remaining time: 0:37:56 +pred is: + ['17 December 1941'] + label is: + ['17 December 1941'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:05,085 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:05,085 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 331, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:05,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:05,086 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:05,086 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:06,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,626 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5396919250488281 s; generated tokens: 20 tokens; generate speed: 12.989611541520386 tokens/s +2024-07-30 13:56:06,631 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:06,631 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[432/2067], cost time 1.5510s, every example cost time is 1.5510, generate speed: 12.8951 tokens/s, avg speed: 10.7341 tokens/s, remaining time: 0:37:55 +pred is: + ['Opportunistic'] + label is: + ['opportunistic'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:06,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:06,714 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:06,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:06,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:06,715 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:07,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:07,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:08,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.286849021911621 s; generated tokens: 12 tokens; generate speed: 9.32510325272963 tokens/s +2024-07-30 13:56:08,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:08,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[433/2067], cost time 1.2980s, every example cost time is 1.2980, generate speed: 9.2452 tokens/s, avg speed: 10.7309 tokens/s, remaining time: 0:37:53 +pred is: + ['violence'] + label is: + ['violence'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:08,095 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:08,096 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:08,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:08,096 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:08,097 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:09,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,639 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.542130947113037 s; generated tokens: 20 tokens; generate speed: 12.969067275020462 tokens/s +2024-07-30 13:56:09,644 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:09,644 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[434/2067], cost time 1.5537s, every example cost time is 1.5537, generate speed: 12.8725 tokens/s, avg speed: 10.7364 tokens/s, remaining time: 0:37:53 +pred is: + ["Luther's declining health"] + label is: + ['declining state of mind'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 13:56:09,727 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:09,727 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:09,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:09,728 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:09,728 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:10,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:10,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:11,263 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5347926616668701 s; generated tokens: 20 tokens; generate speed: 13.03107611830701 tokens/s +2024-07-30 13:56:11,268 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:11,268 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[435/2067], cost time 1.5459s, every example cost time is 1.5459, generate speed: 12.9371 tokens/s, avg speed: 10.7420 tokens/s, remaining time: 0:37:52 +pred is: + ['1980s'] + label is: + ['Since the 1980s'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:56:11,350 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:11,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:11,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:11,351 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:11,351 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:12,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,454 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1022632122039795 s; generated tokens: 6 tokens; generate speed: 5.443345957271836 tokens/s +2024-07-30 13:56:12,458 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:12,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[436/2067], cost time 1.1134s, every example cost time is 1.1134, generate speed: 5.3888 tokens/s, avg speed: 10.7322 tokens/s, remaining time: 0:37:49 +pred is: + ['Deteriorated'] + label is: + ['his health deteriorated'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:56:12,541 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:12,541 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:12,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:12,542 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:12,542 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:13,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,642 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0997233390808105 s; generated tokens: 6 tokens; generate speed: 5.455917671998325 tokens/s +2024-07-30 13:56:13,647 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:13,647 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[437/2067], cost time 1.1109s, every example cost time is 1.1109, generate speed: 5.4010 tokens/s, avg speed: 10.7225 tokens/s, remaining time: 0:37:47 +pred is: + ['His poor physical health'] + label is: + ['poor physical health'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:56:13,730 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:13,730 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:13,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:13,731 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:13,731 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:14,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:14,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:15,265 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337786674499512 s; generated tokens: 20 tokens; generate speed: 13.039691074365932 tokens/s +2024-07-30 13:56:15,270 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:15,270 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[438/2067], cost time 1.5449s, every example cost time is 1.5449, generate speed: 12.9459 tokens/s, avg speed: 10.7281 tokens/s, remaining time: 0:37:46 +pred is: + ['Eisleben'] + label is: + ['Eisleben'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:15,353 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:15,353 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:15,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:15,354 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:15,354 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:16,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,856 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5016686916351318 s; generated tokens: 19 tokens; generate speed: 12.65259115132203 tokens/s +2024-07-30 13:56:16,861 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:16,861 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[439/2067], cost time 1.5129s, every example cost time is 1.5129, generate speed: 12.5590 tokens/s, avg speed: 10.7326 tokens/s, remaining time: 0:37:45 +pred is: + ['Mansfeld'] + label is: + ['Mansfeld'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:16,942 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:16,943 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:16,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:16,943 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:16,943 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:17,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:17,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:17,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:17,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,473 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5296452045440674 s; generated tokens: 20 tokens; generate speed: 13.074927401848905 tokens/s +2024-07-30 13:56:18,478 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:18,478 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[440/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9814 tokens/s, avg speed: 10.7383 tokens/s, remaining time: 0:37:44 +pred is: + ['17 February 1546'] + label is: + ['17 February 1546'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.86377901180351, Em score: 51.13636363636363, current_count: 440 +2024-07-30 13:56:18,669 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:18,670 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:18,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:18,670 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:18,671 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:19,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1024832725524902 s; generated tokens: 6 tokens; generate speed: 5.442259442275878 tokens/s +2024-07-30 13:56:19,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:19,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[441/2067], cost time 1.1137s, every example cost time is 1.1137, generate speed: 5.3874 tokens/s, avg speed: 10.7286 tokens/s, remaining time: 0:37:42 +pred is: + ['Apoplectic stroke'] + label is: + ['apoplectic stroke'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:19,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:19,861 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 81, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:19,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:19,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:19,862 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:20,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:20,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:21,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:21,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:21,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:21,389 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5267667770385742 s; generated tokens: 20 tokens; generate speed: 13.099577683235568 tokens/s +2024-07-30 13:56:21,393 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:21,394 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[442/2067], cost time 1.5379s, every example cost time is 1.5379, generate speed: 13.0044 tokens/s, avg speed: 10.7343 tokens/s, remaining time: 0:37:41 +pred is: + ['"We are beggars"'] + label is: + ['his last statement'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 13:56:21,476 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:21,476 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:21,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:21,477 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:21,477 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:22,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:22,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:23,009 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5313451290130615 s; generated tokens: 20 tokens; generate speed: 13.060413110720393 tokens/s +2024-07-30 13:56:23,013 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:23,014 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[443/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9649 tokens/s, avg speed: 10.7398 tokens/s, remaining time: 0:37:40 +pred is: + ['Images that emphasized his monumental size'] + label is: + ['monumental'] +The F1/Em of this example is: {'F1': 16.666666666666668, 'Em': 0.0} +2024-07-30 13:56:23,096 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:23,097 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 98, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:23,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:23,097 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:23,098 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:24,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,629 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308756828308105 s; generated tokens: 20 tokens; generate speed: 13.064418113309571 tokens/s +2024-07-30 13:56:24,634 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:24,634 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[444/2067], cost time 1.5424s, every example cost time is 1.5424, generate speed: 12.9668 tokens/s, avg speed: 10.7454 tokens/s, remaining time: 0:37:39 +pred is: + ['18 February'] + label is: + ['18 February'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:24,717 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:24,717 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:24,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:24,718 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:24,718 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:25,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:25,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:26,249 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5306553840637207 s; generated tokens: 20 tokens; generate speed: 13.066298402781044 tokens/s +2024-07-30 13:56:26,253 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:26,254 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[445/2067], cost time 1.5418s, every example cost time is 1.5418, generate speed: 12.9716 tokens/s, avg speed: 10.7509 tokens/s, remaining time: 0:37:38 +pred is: + ['SoCal'] + label is: + ['SoCal'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:26,336 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:26,336 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:26,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:26,337 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:26,337 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:27,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,531 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1931970119476318 s; generated tokens: 9 tokens; generate speed: 7.542761094674113 tokens/s +2024-07-30 13:56:27,535 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:27,536 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[446/2067], cost time 1.2043s, every example cost time is 1.2043, generate speed: 7.4734 tokens/s, avg speed: 10.7446 tokens/s, remaining time: 0:37:36 +pred is: + ['Greater Southern California Megaregion'] + label is: + ['Southern California Megaregion'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:56:27,618 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:27,619 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:27,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:27,620 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:27,620 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:28,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:28,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:28,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:28,629 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0090653896331787 s; generated tokens: 3 tokens; generate speed: 2.9730481600311127 tokens/s +2024-07-30 13:56:28,634 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:28,634 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[447/2067], cost time 1.0203s, every example cost time is 1.0203, generate speed: 2.9403 tokens/s, avg speed: 10.7318 tokens/s, remaining time: 0:37:34 +pred is: + ['Pacific'] + label is: + ['Pacific'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:28,715 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:28,716 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 95, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:28,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:28,716 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:28,717 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:29,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:29,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:30,253 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5358295440673828 s; generated tokens: 20 tokens; generate speed: 13.022278466550011 tokens/s +2024-07-30 13:56:30,257 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:30,258 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[448/2067], cost time 1.5470s, every example cost time is 1.5470, generate speed: 12.9285 tokens/s, avg speed: 10.7372 tokens/s, remaining time: 0:37:33 +pred is: + ['Colorado River'] + label is: + ['Colorado River'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:30,340 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:30,340 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:30,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:30,341 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:30,341 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:31,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,873 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531782865524292 s; generated tokens: 20 tokens; generate speed: 13.05668084565921 tokens/s +2024-07-30 13:56:31,878 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:31,878 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[449/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9613 tokens/s, avg speed: 10.7427 tokens/s, remaining time: 0:37:32 +pred is: + ['California'] + label is: + ['California'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:31,960 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:31,960 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 104, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:31,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:31,960 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:31,961 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:32,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:32,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:32,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:32,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,490 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291731357574463 s; generated tokens: 20 tokens; generate speed: 13.078963743430783 tokens/s +2024-07-30 13:56:33,495 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:33,495 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[450/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9830 tokens/s, avg speed: 10.7482 tokens/s, remaining time: 0:37:31 +pred is: + ['Los Angeles'] + label is: + ['Los Angeles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.25939873746714, Em score: 51.55555555555556, current_count: 450 +2024-07-30 13:56:33,689 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:33,689 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:33,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:33,690 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:33,690 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:34,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:34,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:34,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9765338897705078 s; generated tokens: 2 tokens; generate speed: 2.048060001757864 tokens/s +2024-07-30 13:56:34,672 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:34,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[451/2067], cost time 0.9877s, every example cost time is 0.9877, generate speed: 2.0249 tokens/s, avg speed: 10.7345 tokens/s, remaining time: 0:37:28 +pred is: + ['Hollywood'] + label is: + ['Hollywood'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:34,754 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:34,754 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 303, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:34,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:34,755 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:34,755 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:35,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:35,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:36,290 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5350768566131592 s; generated tokens: 20 tokens; generate speed: 13.028663622827334 tokens/s +2024-07-30 13:56:36,295 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:36,295 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[452/2067], cost time 1.5463s, every example cost time is 1.5463, generate speed: 12.9341 tokens/s, avg speed: 10.7399 tokens/s, remaining time: 0:37:27 +pred is: + ['Skateboard'] + label is: + ['skateboard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:36,378 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:36,378 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 79, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:36,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:36,379 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:36,379 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:37,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,449 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0696070194244385 s; generated tokens: 5 tokens; generate speed: 4.674614049083679 tokens/s +2024-07-30 13:56:37,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:37,454 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[453/2067], cost time 1.0809s, every example cost time is 1.0809, generate speed: 4.6259 tokens/s, avg speed: 10.7294 tokens/s, remaining time: 0:37:25 +pred is: + ['Palm Springs'] + label is: + ['Palm Springs'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:37,536 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:37,536 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:37,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:37,537 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:37,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:38,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,823 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2863216400146484 s; generated tokens: 12 tokens; generate speed: 9.328926472747007 tokens/s +2024-07-30 13:56:38,828 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:38,828 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[454/2067], cost time 1.2974s, every example cost time is 1.2974, generate speed: 9.2492 tokens/s, avg speed: 10.7264 tokens/s, remaining time: 0:37:23 +pred is: + ['37° 9\' 58.23"'] + label is: + ['37° 9\' 58.23"'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:38,915 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:38,915 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:38,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:38,916 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:38,916 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:39,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:39,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:39,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:39,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:39,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:40,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:40,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:40,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:40,081 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.16524076461792 s; generated tokens: 8 tokens; generate speed: 6.86553392476205 tokens/s +2024-07-30 13:56:40,086 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:40,086 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[455/2067], cost time 1.1767s, every example cost time is 1.1767, generate speed: 6.7985 tokens/s, avg speed: 10.7191 tokens/s, remaining time: 0:37:21 +pred is: + ['Mexico'] + label is: + ['Mexico'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:40,169 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:40,169 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:40,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:40,170 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:40,170 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:41,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:41,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:41,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:41,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:41,217 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0474145412445068 s; generated tokens: 4 tokens; generate speed: 3.818927313389519 tokens/s +2024-07-30 13:56:41,222 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:41,222 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[456/2067], cost time 1.0585s, every example cost time is 1.0585, generate speed: 3.7789 tokens/s, avg speed: 10.7075 tokens/s, remaining time: 0:37:19 +pred is: + ['Taxes'] + label is: + ['inequitable taxes'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:56:41,305 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:41,305 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 99, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:41,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:41,306 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:41,306 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:42,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,836 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5301334857940674 s; generated tokens: 20 tokens; generate speed: 13.070755058746355 tokens/s +2024-07-30 13:56:42,841 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:42,841 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[457/2067], cost time 1.5413s, every example cost time is 1.5413, generate speed: 12.9762 tokens/s, avg speed: 10.7130 tokens/s, remaining time: 0:37:18 +pred is: + ['The Los Angeles Times'] + label is: + ['Los Angeles Times'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:56:42,924 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:42,924 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:42,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:42,925 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:42,925 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:43,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:43,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:43,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:43,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:43,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,464 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5392143726348877 s; generated tokens: 20 tokens; generate speed: 12.993641662638073 tokens/s +2024-07-30 13:56:44,469 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:44,469 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[458/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9005 tokens/s, avg speed: 10.7183 tokens/s, remaining time: 0:37:17 +pred is: + ['The state is most commonly divided and promoted by its regional tourism groups as consisting of northern, central'] + label is: + ['regional tourism groups'] +The F1/Em of this example is: {'F1': 24.39024390243903, 'Em': 0.0} +2024-07-30 13:56:44,552 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:44,553 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:44,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:44,553 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:44,554 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:45,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:45,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:46,110 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5562686920166016 s; generated tokens: 20 tokens; generate speed: 12.851251266954517 tokens/s +2024-07-30 13:56:46,115 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:46,115 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[459/2067], cost time 1.5674s, every example cost time is 1.5674, generate speed: 12.7598 tokens/s, avg speed: 10.7233 tokens/s, remaining time: 0:37:16 +pred is: + ['3rd'] + label is: + ['third'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:56:46,197 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:46,198 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:46,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:46,198 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:46,199 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:47,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,517 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.318161964416504 s; generated tokens: 13 tokens; generate speed: 9.862217505080695 tokens/s +2024-07-30 13:56:47,522 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:47,522 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[460/2067], cost time 1.3292s, every example cost time is 1.3292, generate speed: 9.7807 tokens/s, avg speed: 10.7214 tokens/s, remaining time: 0:37:14 +pred is: + ['Camp Pendleton'] + label is: + ['Camp Pendleton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.50968045455649, Em score: 51.73913043478261, current_count: 460 +2024-07-30 13:56:47,745 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:47,745 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 138, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:47,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:47,746 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:47,746 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:48,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,847 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1011395454406738 s; generated tokens: 6 tokens; generate speed: 5.448900663719976 tokens/s +2024-07-30 13:56:48,852 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:48,852 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[461/2067], cost time 1.1126s, every example cost time is 1.1126, generate speed: 5.3930 tokens/s, avg speed: 10.7121 tokens/s, remaining time: 0:37:12 +pred is: + ['Mediterranean'] + label is: + ['Mediterranean'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:48,935 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:48,936 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 133, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:48,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:48,936 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:48,936 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:49,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:49,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:49,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:49,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,466 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5293774604797363 s; generated tokens: 20 tokens; generate speed: 13.077216394784832 tokens/s +2024-07-30 13:56:50,471 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:50,471 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[462/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9827 tokens/s, avg speed: 10.7176 tokens/s, remaining time: 0:37:11 +pred is: + ['1'] + label is: + ['Pacific Ocean'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:56:50,553 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:50,553 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:50,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:50,554 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:50,554 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:51,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,625 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0707461833953857 s; generated tokens: 5 tokens; generate speed: 4.66964073982946 tokens/s +2024-07-30 13:56:51,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:51,630 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[463/2067], cost time 1.0818s, every example cost time is 1.0818, generate speed: 4.6219 tokens/s, avg speed: 10.7073 tokens/s, remaining time: 0:37:09 +pred is: + ['10,000'] + label is: + ['10,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:51,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:51,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 125, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:51,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:51,713 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:51,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:52,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:52,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:53,241 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5267565250396729 s; generated tokens: 20 tokens; generate speed: 13.09966564543112 tokens/s +2024-07-30 13:56:53,245 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:53,246 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[464/2067], cost time 1.5378s, every example cost time is 1.5378, generate speed: 13.0055 tokens/s, avg speed: 10.7128 tokens/s, remaining time: 0:37:08 +pred is: + ['San Andreas Fault'] + label is: + ['San Andreas'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:56:53,328 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:53,328 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:53,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:53,329 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:53,329 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:54,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,398 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0687892436981201 s; generated tokens: 5 tokens; generate speed: 4.6781907934435125 tokens/s +2024-07-30 13:56:54,405 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:54,405 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[465/2067], cost time 1.0817s, every example cost time is 1.0817, generate speed: 4.6224 tokens/s, avg speed: 10.7026 tokens/s, remaining time: 0:37:05 +pred is: + ['economically'] + label is: + ['economically'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:54,487 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:54,488 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:54,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:54,488 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:54,489 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:55,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2541282176971436 s; generated tokens: 11 tokens; generate speed: 8.771033013034687 tokens/s +2024-07-30 13:56:55,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:55,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[466/2067], cost time 1.2653s, every example cost time is 1.2653, generate speed: 8.6936 tokens/s, avg speed: 10.6987 tokens/s, remaining time: 0:37:04 +pred is: + ['2010'] + label is: + ['2010'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:55,830 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:55,830 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:55,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:55,831 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:55,831 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:56,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:56,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:57,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:57,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:57,383 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5519912242889404 s; generated tokens: 20 tokens; generate speed: 12.886670805218754 tokens/s +2024-07-30 13:56:57,388 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:57,389 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[467/2067], cost time 1.5632s, every example cost time is 1.5632, generate speed: 12.7942 tokens/s, avg speed: 10.7037 tokens/s, remaining time: 0:37:03 +pred is: + ['Metropolitan Statistical Areas'] + label is: + ['Metropolitan Statistical Areas'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:57,471 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:57,472 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:57,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:57,472 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:57,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:58,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:58,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:58,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:58,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:58,512 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0397498607635498 s; generated tokens: 4 tokens; generate speed: 3.8470791398448116 tokens/s +2024-07-30 13:56:58,517 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:56:58,517 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[468/2067], cost time 1.0508s, every example cost time is 1.0508, generate speed: 3.8066 tokens/s, avg speed: 10.6926 tokens/s, remaining time: 0:37:00 +pred is: + ['Los Angeles'] + label is: + ['Los Angeles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:56:58,599 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:56:58,600 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:56:58,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:58,600 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:56:58,601 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:56:59,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:56:59,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:00,131 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5298595428466797 s; generated tokens: 20 tokens; generate speed: 13.073095561952755 tokens/s +2024-07-30 13:57:00,135 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:00,136 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[469/2067], cost time 1.5410s, every example cost time is 1.5410, generate speed: 12.9786 tokens/s, avg speed: 10.6980 tokens/s, remaining time: 0:36:59 +pred is: + ['Petroleum'] + label is: + ['petroleum'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:00,217 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:00,217 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 117, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:00,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:00,218 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:00,218 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:01,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,505 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.286888599395752 s; generated tokens: 12 tokens; generate speed: 9.32481646479307 tokens/s +2024-07-30 13:57:01,510 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:01,510 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[470/2067], cost time 1.2980s, every example cost time is 1.2980, generate speed: 9.2449 tokens/s, avg speed: 10.6951 tokens/s, remaining time: 0:36:58 +pred is: + ['1920s'] + label is: + ['1920s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.99883618956592, Em score: 52.340425531914896, current_count: 470 +2024-07-30 13:57:01,734 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:01,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 91, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:01,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:01,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:01,735 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:02,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:02,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:03,049 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3135836124420166 s; generated tokens: 13 tokens; generate speed: 9.896591185263311 tokens/s +2024-07-30 13:57:03,053 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:03,054 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[471/2067], cost time 1.3251s, every example cost time is 1.3251, generate speed: 9.8108 tokens/s, avg speed: 10.6933 tokens/s, remaining time: 0:36:56 +pred is: + ['CBD'] + label is: + ['business'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:03,136 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:03,137 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 119, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:03,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:03,137 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:03,137 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:04,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,666 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5285263061523438 s; generated tokens: 20 tokens; generate speed: 13.084498395284182 tokens/s +2024-07-30 13:57:04,671 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:04,671 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[472/2067], cost time 1.5397s, every example cost time is 1.5397, generate speed: 12.9897 tokens/s, avg speed: 10.6987 tokens/s, remaining time: 0:36:55 +pred is: + ['1'] + label is: + ['business'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:04,753 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:04,754 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 83, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:04,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:04,754 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:04,755 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:05,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:05,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:06,304 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5493042469024658 s; generated tokens: 20 tokens; generate speed: 12.90902031669127 tokens/s +2024-07-30 13:57:06,309 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:06,309 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[473/2067], cost time 1.5605s, every example cost time is 1.5605, generate speed: 12.8165 tokens/s, avg speed: 10.7037 tokens/s, remaining time: 0:36:54 +pred is: + ['Business'] + label is: + ['business'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:06,392 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:06,392 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 111, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:06,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:06,393 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:06,393 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:07,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:07,921 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5279598236083984 s; generated tokens: 20 tokens; generate speed: 13.089349399756083 tokens/s +2024-07-30 13:57:07,955 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:07,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[474/2067], cost time 1.5685s, every example cost time is 1.5685, generate speed: 12.7507 tokens/s, avg speed: 10.7086 tokens/s, remaining time: 0:36:54 +pred is: + ['Orange County'] + label is: + ['Orange'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:57:08,038 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:08,038 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 114, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:08,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:08,039 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:08,039 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:08,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,580 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5406534671783447 s; generated tokens: 20 tokens; generate speed: 12.981504553797766 tokens/s +2024-07-30 13:57:09,585 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:09,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[475/2067], cost time 1.5521s, every example cost time is 1.5521, generate speed: 12.8861 tokens/s, avg speed: 10.7137 tokens/s, remaining time: 0:36:53 +pred is: + ['Downtown San Diego'] + label is: + ['Downtown San Diego'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:09,667 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:09,668 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:09,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:09,668 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:09,669 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:10,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,770 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1012165546417236 s; generated tokens: 6 tokens; generate speed: 5.448519616518184 tokens/s +2024-07-30 13:57:10,775 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:10,775 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[476/2067], cost time 1.1127s, every example cost time is 1.1127, generate speed: 5.3925 tokens/s, avg speed: 10.7048 tokens/s, remaining time: 0:36:50 +pred is: + ['Los Angeles International Airport'] + label is: + ['Los Angeles International Airport'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:10,858 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:10,858 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 102, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:10,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:10,859 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:10,859 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:11,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:11,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:11,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:11,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:11,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:11,927 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0678224563598633 s; generated tokens: 5 tokens; generate speed: 4.682426343649554 tokens/s +2024-07-30 13:57:11,932 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:11,932 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[477/2067], cost time 1.0791s, every example cost time is 1.0791, generate speed: 4.6336 tokens/s, avg speed: 10.6949 tokens/s, remaining time: 0:36:48 +pred is: + ['Metrolink'] + label is: + ['Metrolink'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:12,014 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:12,014 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 90, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:12,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:12,015 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:12,015 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:12,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:12,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,565 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5495247840881348 s; generated tokens: 20 tokens; generate speed: 12.907183031454132 tokens/s +2024-07-30 13:57:13,570 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:13,570 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[478/2067], cost time 1.5607s, every example cost time is 1.5607, generate speed: 12.8145 tokens/s, avg speed: 10.6998 tokens/s, remaining time: 0:36:47 +pred is: + ['Port of Los Angeles'] + label is: + ['Port of Los Angeles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:13,652 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:13,652 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:13,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:13,653 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:13,653 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:14,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:14,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:15,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3757555484771729 s; generated tokens: 15 tokens; generate speed: 10.90309976696335 tokens/s +2024-07-30 13:57:15,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:15,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[479/2067], cost time 1.3869s, every example cost time is 1.3869, generate speed: 10.8153 tokens/s, avg speed: 10.7001 tokens/s, remaining time: 0:36:46 +pred is: + ['Tech Coast'] + label is: + ['The Tech Coast'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:57:15,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:15,116 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 113, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:15,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:15,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:15,117 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:16,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,523 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4053092002868652 s; generated tokens: 16 tokens; generate speed: 11.3853947563525 tokens/s +2024-07-30 13:57:16,528 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:16,528 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[480/2067], cost time 1.4165s, every example cost time is 1.4165, generate speed: 11.2956 tokens/s, avg speed: 10.7014 tokens/s, remaining time: 0:36:45 +pred is: + ['NFL'] + label is: + ['NFL'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 65.15511043561663, Em score: 52.5, current_count: 480 +2024-07-30 13:57:16,729 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:16,729 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 114, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:16,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:16,730 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:16,730 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:17,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:17,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:18,277 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5470967292785645 s; generated tokens: 20 tokens; generate speed: 12.9274399082508 tokens/s +2024-07-30 13:57:18,282 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:18,282 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[481/2067], cost time 1.5584s, every example cost time is 1.5584, generate speed: 12.8336 tokens/s, avg speed: 10.7063 tokens/s, remaining time: 0:36:44 +pred is: + ['Chivas USA'] + label is: + ['Chivas USA'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:18,365 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:18,365 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 91, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:18,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:18,366 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:18,366 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:19,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:19,896 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5299725532531738 s; generated tokens: 20 tokens; generate speed: 13.072129926431744 tokens/s +2024-07-30 13:57:19,901 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:19,901 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[482/2067], cost time 1.5414s, every example cost time is 1.5414, generate speed: 12.9756 tokens/s, avg speed: 10.7115 tokens/s, remaining time: 0:36:43 +pred is: + ['1'] + label is: + ['College'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:20,014 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:20,015 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 79, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:20,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:20,015 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:20,016 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:20,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:20,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,362 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3462929725646973 s; generated tokens: 14 tokens; generate speed: 10.398925260175655 tokens/s +2024-07-30 13:57:21,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:21,367 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[483/2067], cost time 1.3580s, every example cost time is 1.3580, generate speed: 10.3091 tokens/s, avg speed: 10.7107 tokens/s, remaining time: 0:36:41 +pred is: + ['rugby'] + label is: + ['Rugby'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:21,449 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:21,449 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:21,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:21,450 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:21,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:22,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:22,980 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5294525623321533 s; generated tokens: 20 tokens; generate speed: 13.076574254453126 tokens/s +2024-07-30 13:57:22,985 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:22,985 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[484/2067], cost time 1.5408s, every example cost time is 1.5408, generate speed: 12.9801 tokens/s, avg speed: 10.7159 tokens/s, remaining time: 0:36:40 +pred is: + ['BSkyB'] + label is: + ['BSkyB'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:23,067 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:23,068 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:23,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:23,068 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:23,069 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:24,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,295 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2257583141326904 s; generated tokens: 10 tokens; generate speed: 8.158215110354522 tokens/s +2024-07-30 13:57:24,299 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:24,300 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[485/2067], cost time 1.2371s, every example cost time is 1.2371, generate speed: 8.0836 tokens/s, avg speed: 10.7111 tokens/s, remaining time: 0:36:39 +pred is: + ['2006'] + label is: + ['2006'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:24,382 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:24,382 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:24,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:24,383 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:24,383 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:25,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:25,921 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378892421722412 s; generated tokens: 20 tokens; generate speed: 13.004837703234308 tokens/s +2024-07-30 13:57:25,926 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:25,926 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[486/2067], cost time 1.5492s, every example cost time is 1.5492, generate speed: 12.9100 tokens/s, avg speed: 10.7161 tokens/s, remaining time: 0:36:38 +pred is: + ['ONdigital'] + label is: + ['ONdigital'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:26,009 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:26,010 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 264, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:26,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:26,010 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:26,010 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:26,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:26,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,237 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2262310981750488 s; generated tokens: 10 tokens; generate speed: 8.155069639713593 tokens/s +2024-07-30 13:57:27,242 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:27,242 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[487/2067], cost time 1.2374s, every example cost time is 1.2374, generate speed: 8.0815 tokens/s, avg speed: 10.7113 tokens/s, remaining time: 0:36:36 +pred is: + ['Sky+ PVR'] + label is: + ['Sky+ PVR'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:27,325 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:27,325 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:27,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:27,326 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:27,326 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:28,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,856 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5296037197113037 s; generated tokens: 20 tokens; generate speed: 13.075282010803939 tokens/s +2024-07-30 13:57:28,860 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:28,861 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[488/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9790 tokens/s, avg speed: 10.7165 tokens/s, remaining time: 0:36:35 +pred is: + ['VideoGuard'] + label is: + ['VideoGuard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:28,944 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:28,944 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:28,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:28,945 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:28,945 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:29,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:29,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:29,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:29,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:29,985 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0401983261108398 s; generated tokens: 4 tokens; generate speed: 3.8454205314437067 tokens/s +2024-07-30 13:57:29,990 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:29,990 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[489/2067], cost time 1.0520s, every example cost time is 1.0520, generate speed: 3.8024 tokens/s, avg speed: 10.7058 tokens/s, remaining time: 0:36:32 +pred is: + ['Basic channels'] + label is: + ['basic channels'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:30,073 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:30,073 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:30,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:30,074 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:30,074 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:31,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,603 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5286476612091064 s; generated tokens: 20 tokens; generate speed: 13.083459653600428 tokens/s +2024-07-30 13:57:31,608 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:31,608 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[490/2067], cost time 1.5398s, every example cost time is 1.5398, generate speed: 12.9890 tokens/s, avg speed: 10.7109 tokens/s, remaining time: 0:36:31 +pred is: + ['2013'] + label is: + ['July 2013'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 65.56010818182854, Em score: 53.06122448979592, current_count: 490 +2024-07-30 13:57:31,811 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:31,812 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:31,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:31,812 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:31,812 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:32,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:32,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:33,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:33,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:33,129 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3168070316314697 s; generated tokens: 13 tokens; generate speed: 9.872365265162303 tokens/s +2024-07-30 13:57:33,134 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:33,134 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[491/2067], cost time 1.3282s, every example cost time is 1.3282, generate speed: 9.7876 tokens/s, avg speed: 10.7091 tokens/s, remaining time: 0:36:30 +pred is: + ['Sam Chisholm'] + label is: + ['Sam Chisholm'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:33,223 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:33,223 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:33,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:33,224 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:33,224 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:34,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,293 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.068993091583252 s; generated tokens: 5 tokens; generate speed: 4.677298702271927 tokens/s +2024-07-30 13:57:34,298 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:34,298 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[492/2067], cost time 1.0805s, every example cost time is 1.0805, generate speed: 4.6277 tokens/s, avg speed: 10.6995 tokens/s, remaining time: 0:36:27 +pred is: + ['British Sky Broadcasting'] + label is: + ['BSkyB'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:34,380 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:34,381 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:34,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:34,381 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:34,382 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:35,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,881 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4990887641906738 s; generated tokens: 19 tokens; generate speed: 12.674366224242696 tokens/s +2024-07-30 13:57:35,886 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:35,886 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[493/2067], cost time 1.5103s, every example cost time is 1.5103, generate speed: 12.5807 tokens/s, avg speed: 10.7037 tokens/s, remaining time: 0:36:26 +pred is: + ['Sky Q Hub'] + label is: + ['Sky Q Hub'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:35,968 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:35,968 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:35,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:35,969 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:35,969 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:36,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:36,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:36,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,131 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.161585807800293 s; generated tokens: 8 tokens; generate speed: 6.887136487273104 tokens/s +2024-07-30 13:57:37,136 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:37,136 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[494/2067], cost time 1.1726s, every example cost time is 1.1726, generate speed: 6.8222 tokens/s, avg speed: 10.6970 tokens/s, remaining time: 0:36:24 +pred is: + ['DVB-compliant MPEG-2'] + label is: + ['DVB-compliant MPEG-2'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:37,218 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:37,219 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:37,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:37,219 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:37,219 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:38,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,756 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536057949066162 s; generated tokens: 20 tokens; generate speed: 13.020342111545263 tokens/s +2024-07-30 13:57:38,761 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:38,761 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[495/2067], cost time 1.5473s, every example cost time is 1.5473, generate speed: 12.9254 tokens/s, avg speed: 10.7020 tokens/s, remaining time: 0:36:24 +pred is: + ['1998'] + label is: + ['1998'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:38,843 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:38,843 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:38,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:38,844 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:38,844 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:39,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:39,977 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1329278945922852 s; generated tokens: 7 tokens; generate speed: 6.178680949963845 tokens/s +2024-07-30 13:57:39,982 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:39,982 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[496/2067], cost time 1.1440s, every example cost time is 1.1440, generate speed: 6.1187 tokens/s, avg speed: 10.6944 tokens/s, remaining time: 0:36:21 +pred is: + ['22 May 2006'] + label is: + ['22 May 2006'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:40,064 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:40,064 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:40,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:40,065 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:40,065 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:41,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,352 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.286865472793579 s; generated tokens: 12 tokens; generate speed: 9.324984043553457 tokens/s +2024-07-30 13:57:41,357 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:41,357 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[497/2067], cost time 1.2980s, every example cost time is 1.2980, generate speed: 9.2451 tokens/s, avg speed: 10.6917 tokens/s, remaining time: 0:36:20 +pred is: + ['8 February 2007'] + label is: + ['8 February 2007'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:41,439 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:41,439 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:41,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:41,440 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:41,440 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:42,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,511 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0707905292510986 s; generated tokens: 5 tokens; generate speed: 4.669447350731572 tokens/s +2024-07-30 13:57:42,516 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:42,516 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[498/2067], cost time 1.0819s, every example cost time is 1.0819, generate speed: 4.6214 tokens/s, avg speed: 10.6822 tokens/s, remaining time: 0:36:17 +pred is: + ['Free-to-view'] + label is: + ['free-to-view'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:42,598 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:42,598 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 316, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:42,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:42,599 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:42,599 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:43,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,763 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1639149188995361 s; generated tokens: 8 tokens; generate speed: 6.873354632797282 tokens/s +2024-07-30 13:57:43,768 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:43,768 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[499/2067], cost time 1.1749s, every example cost time is 1.1749, generate speed: 6.8089 tokens/s, avg speed: 10.6756 tokens/s, remaining time: 0:36:15 +pred is: + ['Autumn of 1991'] + label is: + ['1991'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 13:57:43,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:43,860 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:43,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:43,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:43,861 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:44,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:44,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:45,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:45,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1622381210327148 s; generated tokens: 8 tokens; generate speed: 6.883271039923853 tokens/s +2024-07-30 13:57:45,028 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:45,029 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[500/2067], cost time 1.1738s, every example cost time is 1.1738, generate speed: 6.8155 tokens/s, avg speed: 10.6691 tokens/s, remaining time: 0:36:13 +pred is: + ['Ofcom'] + label is: + ['Ofcom'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 65.91557268485862, Em score: 53.6, current_count: 500 +2024-07-30 13:57:45,233 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:45,233 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:45,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:45,234 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:45,234 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:46,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,766 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5314509868621826 s; generated tokens: 20 tokens; generate speed: 13.059510341221143 tokens/s +2024-07-30 13:57:46,770 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:46,771 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[501/2067], cost time 1.5427s, every example cost time is 1.5427, generate speed: 12.9639 tokens/s, avg speed: 10.6742 tokens/s, remaining time: 0:36:12 +pred is: + ['1 October 1998'] + label is: + ['1 October 1998'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:46,853 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:46,853 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:46,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:46,854 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:46,854 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:47,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:47,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:48,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:48,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:48,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:48,109 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2547261714935303 s; generated tokens: 11 tokens; generate speed: 8.766853079111627 tokens/s +2024-07-30 13:57:48,114 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:48,114 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[502/2067], cost time 1.2659s, every example cost time is 1.2659, generate speed: 8.6894 tokens/s, avg speed: 10.6706 tokens/s, remaining time: 0:36:11 +pred is: + ['2007'] + label is: + ['2007'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:48,196 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:48,196 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:48,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:48,197 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:48,197 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:49,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,730 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5326786041259766 s; generated tokens: 20 tokens; generate speed: 13.04905017017914 tokens/s +2024-07-30 13:57:49,735 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:49,735 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[503/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9542 tokens/s, avg speed: 10.6756 tokens/s, remaining time: 0:36:10 +pred is: + ['10'] + label is: + ['10 million'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:57:49,818 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:49,818 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:49,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:49,819 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:49,819 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:50,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:50,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:51,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:51,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:51,351 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531691312789917 s; generated tokens: 20 tokens; generate speed: 13.057461273688865 tokens/s +2024-07-30 13:57:51,355 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:51,356 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[504/2067], cost time 1.5430s, every example cost time is 1.5430, generate speed: 12.9620 tokens/s, avg speed: 10.6807 tokens/s, remaining time: 0:36:09 +pred is: + ['A Welfare Cash Card'] + label is: + ['Welfare Cash Card'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 13:57:51,438 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:51,438 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:51,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:51,439 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:51,439 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:52,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,508 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0686712265014648 s; generated tokens: 5 tokens; generate speed: 4.678707422832579 tokens/s +2024-07-30 13:57:52,513 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:52,513 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[505/2067], cost time 1.0797s, every example cost time is 1.0797, generate speed: 4.6309 tokens/s, avg speed: 10.6714 tokens/s, remaining time: 0:36:06 +pred is: + ['£30m'] + label is: + ['£30m'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:52,595 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:52,596 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:52,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:52,596 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:52,596 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:53,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:53,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:54,133 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536525011062622 s; generated tokens: 20 tokens; generate speed: 13.016384280115625 tokens/s +2024-07-30 13:57:54,138 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:54,138 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[506/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9226 tokens/s, avg speed: 10.6763 tokens/s, remaining time: 0:36:06 +pred is: + ['1'] + label is: + ['diversified'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:54,220 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:54,220 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:54,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:54,221 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:54,221 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:55,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,750 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5281524658203125 s; generated tokens: 20 tokens; generate speed: 13.087699328001278 tokens/s +2024-07-30 13:57:55,755 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:55,755 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[507/2067], cost time 1.5393s, every example cost time is 1.5393, generate speed: 12.9931 tokens/s, avg speed: 10.6814 tokens/s, remaining time: 0:36:05 +pred is: + ['1'] + label is: + ['Bendigo'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:57:55,837 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:55,837 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:55,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:55,838 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:55,838 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:56,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:56,940 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1019456386566162 s; generated tokens: 6 tokens; generate speed: 5.444914694081107 tokens/s +2024-07-30 13:57:56,945 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:56,945 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[508/2067], cost time 1.1131s, every example cost time is 1.1131, generate speed: 5.3903 tokens/s, avg speed: 10.6730 tokens/s, remaining time: 0:36:02 +pred is: + ['Proportional Representation'] + label is: + ['multi-member proportional'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 13:57:57,028 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:57,029 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:57,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:57,029 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:57,030 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:57,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,559 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5294654369354248 s; generated tokens: 20 tokens; generate speed: 13.07646417958539 tokens/s +2024-07-30 13:57:58,564 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:58,564 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[509/2067], cost time 1.5413s, every example cost time is 1.5413, generate speed: 12.9764 tokens/s, avg speed: 10.6781 tokens/s, remaining time: 0:36:01 +pred is: + ['Australian Labor Party'] + label is: + ['Australian Labor Party'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:57:58,647 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:58,647 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:58,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:58,648 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:58,648 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:57:59,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.073831558227539 s; generated tokens: 5 tokens; generate speed: 4.656223745419602 tokens/s +2024-07-30 13:57:59,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:57:59,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[510/2067], cost time 1.0850s, every example cost time is 1.0850, generate speed: 4.6084 tokens/s, avg speed: 10.6688 tokens/s, remaining time: 0:35:59 +pred is: + ['61.1'] + label is: + ['61.1%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.7342215864627, Em score: 53.333333333333336, current_count: 510 +2024-07-30 13:57:59,934 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:57:59,934 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:57:59,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:57:59,935 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:57:59,935 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:00,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:00,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:00,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:00,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,462 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5269725322723389 s; generated tokens: 20 tokens; generate speed: 13.097812552159882 tokens/s +2024-07-30 13:58:01,467 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:01,467 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[511/2067], cost time 1.5384s, every example cost time is 1.5384, generate speed: 13.0006 tokens/s, avg speed: 10.6738 tokens/s, remaining time: 0:35:58 +pred is: + ['South-east'] + label is: + ['south-east'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:01,550 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:01,550 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:01,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:01,551 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:01,551 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:02,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:02,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:03,085 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5334599018096924 s; generated tokens: 20 tokens; generate speed: 13.042401680276912 tokens/s +2024-07-30 13:58:03,091 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:03,091 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[512/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9412 tokens/s, avg speed: 10.6787 tokens/s, remaining time: 0:35:57 +pred is: + ['Koori'] + label is: + ['Koori'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:03,182 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:03,182 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:03,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:03,183 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:03,183 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:04,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,625 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4412422180175781 s; generated tokens: 17 tokens; generate speed: 11.795380254252764 tokens/s +2024-07-30 13:58:04,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:04,630 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[513/2067], cost time 1.4529s, every example cost time is 1.4529, generate speed: 11.7006 tokens/s, avg speed: 10.6808 tokens/s, remaining time: 0:35:56 +pred is: + ['More than 26,000 square kilometres (10,000 sq mi)'] + label is: + ['26,000 square kilometres'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:58:04,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:04,714 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:04,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:04,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:04,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:05,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:05,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:06,122 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4075589179992676 s; generated tokens: 16 tokens; generate speed: 11.367197348117207 tokens/s +2024-07-30 13:58:06,127 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:06,127 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[514/2067], cost time 1.4188s, every example cost time is 1.4188, generate speed: 11.2768 tokens/s, avg speed: 10.6820 tokens/s, remaining time: 0:35:55 +pred is: + ['1975'] + label is: + ['1975'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:06,211 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:06,211 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:06,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:06,212 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:06,212 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:07,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:07,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:07,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:07,221 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0093581676483154 s; generated tokens: 3 tokens; generate speed: 2.97218578712217 tokens/s +2024-07-30 13:58:07,226 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:07,226 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[515/2067], cost time 1.0207s, every example cost time is 1.0207, generate speed: 2.9391 tokens/s, avg speed: 10.6710 tokens/s, remaining time: 0:35:52 +pred is: + ['Hot'] + label is: + ['warmest regions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:07,309 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:07,309 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:07,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:07,310 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:07,310 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:08,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,567 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2565991878509521 s; generated tokens: 11 tokens; generate speed: 8.753785699012193 tokens/s +2024-07-30 13:58:08,571 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:08,572 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[516/2067], cost time 1.2678s, every example cost time is 1.2678, generate speed: 8.6766 tokens/s, avg speed: 10.6674 tokens/s, remaining time: 0:35:51 +pred is: + ['Public schools'] + label is: + ['state or government'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 13:58:08,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:08,654 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:08,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:08,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:08,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:09,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,727 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071746826171875 s; generated tokens: 5 tokens; generate speed: 4.665280902075799 tokens/s +2024-07-30 13:58:09,732 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:09,732 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[517/2067], cost time 1.0830s, every example cost time is 1.0830, generate speed: 4.6167 tokens/s, avg speed: 10.6583 tokens/s, remaining time: 0:35:48 +pred is: + ['Car manufacturing plant'] + label is: + ['major car brands'] +The F1/Em of this example is: {'F1': 40.00000000000001, 'Em': 0.0} +2024-07-30 13:58:09,815 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:09,816 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 264, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:09,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:09,816 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:09,816 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:10,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:10,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:11,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:11,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:11,360 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5437955856323242 s; generated tokens: 20 tokens; generate speed: 12.955083034395507 tokens/s +2024-07-30 13:58:11,365 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:11,366 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[518/2067], cost time 1.5552s, every example cost time is 1.5552, generate speed: 12.8603 tokens/s, avg speed: 10.6630 tokens/s, remaining time: 0:35:47 +pred is: + ['1960'] + label is: + ['2,000 m'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:11,448 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:11,448 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:11,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:11,449 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:11,449 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:12,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,855 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4058997631072998 s; generated tokens: 16 tokens; generate speed: 11.380612202847965 tokens/s +2024-07-30 13:58:12,860 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:12,860 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[519/2067], cost time 1.4172s, every example cost time is 1.4172, generate speed: 11.2899 tokens/s, avg speed: 10.6643 tokens/s, remaining time: 0:35:46 +pred is: + ['The Victorian Alps in the northeast are the coldest part of Victoria.'] + label is: + ['Victorian Alps'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 13:58:12,944 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:12,944 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:12,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:12,945 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:12,945 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:13,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:13,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:13,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:13,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:14,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:14,013 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.067713737487793 s; generated tokens: 5 tokens; generate speed: 4.682903126978981 tokens/s +2024-07-30 13:58:14,017 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:14,018 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[520/2067], cost time 1.0786s, every example cost time is 1.0786, generate speed: 4.6354 tokens/s, avg speed: 10.6553 tokens/s, remaining time: 0:35:44 +pred is: + ['The Victorian Government'] + label is: + ['government-owned'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.31091390638115, Em score: 52.88461538461539, current_count: 520 +2024-07-30 13:58:14,228 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:14,228 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:14,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:14,229 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:14,229 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:15,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,423 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1938090324401855 s; generated tokens: 9 tokens; generate speed: 7.538894207898309 tokens/s +2024-07-30 13:58:15,429 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:15,430 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[521/2067], cost time 1.2069s, every example cost time is 1.2069, generate speed: 7.4573 tokens/s, avg speed: 10.6499 tokens/s, remaining time: 0:35:42 +pred is: + ['37'] + label is: + ['37'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:15,512 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:15,512 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:15,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:15,512 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:15,513 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:16,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:16,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:17,045 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5326178073883057 s; generated tokens: 20 tokens; generate speed: 13.049567807176587 tokens/s +2024-07-30 13:58:17,050 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:17,051 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[522/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9541 tokens/s, avg speed: 10.6548 tokens/s, remaining time: 0:35:41 +pred is: + ['1 July 1851'] + label is: + ['1 July 1851'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:17,133 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:17,133 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:17,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:17,134 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:17,134 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:18,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,393 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2589457035064697 s; generated tokens: 11 tokens; generate speed: 8.737469748983079 tokens/s +2024-07-30 13:58:18,398 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:18,398 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[523/2067], cost time 1.2701s, every example cost time is 1.2701, generate speed: 8.6610 tokens/s, avg speed: 10.6513 tokens/s, remaining time: 0:35:39 +pred is: + ['1548'] + label is: + ['1,548'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:18,481 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:18,482 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:18,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:18,482 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:18,482 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:19,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:19,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:19,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:19,493 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0104310512542725 s; generated tokens: 3 tokens; generate speed: 2.9690298969692464 tokens/s +2024-07-30 13:58:19,498 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:19,498 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[524/2067], cost time 1.0216s, every example cost time is 1.0216, generate speed: 2.9365 tokens/s, avg speed: 10.6405 tokens/s, remaining time: 0:35:37 +pred is: + ['Victoria'] + label is: + ['Victoria'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:19,581 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:19,581 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:19,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:19,582 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:19,582 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:20,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,903 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3205835819244385 s; generated tokens: 13 tokens; generate speed: 9.844132683412262 tokens/s +2024-07-30 13:58:20,907 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:20,908 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[525/2067], cost time 1.3318s, every example cost time is 1.3318, generate speed: 9.7609 tokens/s, avg speed: 10.6389 tokens/s, remaining time: 0:35:35 +pred is: + ['1,600 mm (5 ft 3 in)'] + label is: + ['1,600 mm'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:58:20,989 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:20,990 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:20,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:20,990 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:20,991 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:21,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:21,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:21,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,522 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5316059589385986 s; generated tokens: 20 tokens; generate speed: 13.05818894427649 tokens/s +2024-07-30 13:58:22,527 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:22,527 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[526/2067], cost time 1.5427s, every example cost time is 1.5427, generate speed: 12.9640 tokens/s, avg speed: 10.6438 tokens/s, remaining time: 0:35:34 +pred is: + ['1788'] + label is: + ['1788'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:22,609 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:22,610 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:22,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:22,610 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:22,610 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:23,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:23,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:24,144 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5332114696502686 s; generated tokens: 20 tokens; generate speed: 13.044514990852552 tokens/s +2024-07-30 13:58:24,149 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:24,149 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[527/2067], cost time 1.5443s, every example cost time is 1.5443, generate speed: 12.9509 tokens/s, avg speed: 10.6487 tokens/s, remaining time: 0:35:33 +pred is: + ['1854'] + label is: + ['1854'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:24,232 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:24,232 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:24,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:24,233 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:24,233 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:25,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,763 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5299973487854004 s; generated tokens: 20 tokens; generate speed: 13.07191807611768 tokens/s +2024-07-30 13:58:25,768 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:25,768 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[528/2067], cost time 1.5413s, every example cost time is 1.5413, generate speed: 12.9765 tokens/s, avg speed: 10.6536 tokens/s, remaining time: 0:35:32 +pred is: + ['The Premier of Victoria needs to lead in the Legislative Assembly.'] + label is: + ['most seats'] +The F1/Em of this example is: {'F1': 8.0, 'Em': 0.0} +2024-07-30 13:58:25,852 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:25,852 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:25,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:25,853 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:25,853 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:26,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:26,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:26,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:26,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:26,892 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0389018058776855 s; generated tokens: 4 tokens; generate speed: 3.8502195081090633 tokens/s +2024-07-30 13:58:26,897 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:26,897 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[529/2067], cost time 1.0499s, every example cost time is 1.0499, generate speed: 3.8098 tokens/s, avg speed: 10.6438 tokens/s, remaining time: 0:35:30 +pred is: + ['17%'] + label is: + ['$8.7 billion'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:26,985 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:26,986 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:26,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:26,986 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:26,987 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:27,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:27,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:27,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,273 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2859575748443604 s; generated tokens: 12 tokens; generate speed: 9.331567568589781 tokens/s +2024-07-30 13:58:28,277 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:28,278 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[530/2067], cost time 1.2974s, every example cost time is 1.2974, generate speed: 9.2494 tokens/s, avg speed: 10.6413 tokens/s, remaining time: 0:35:28 +pred is: + ["Events play a big part in Victoria's economy."] + label is: + ['tourism'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.13146270060037, Em score: 52.83018867924528, current_count: 530 +2024-07-30 13:58:28,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:28,491 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:28,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:28,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:28,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:29,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,668 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1763577461242676 s; generated tokens: 8 tokens; generate speed: 6.800652289966644 tokens/s +2024-07-30 13:58:29,673 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:29,673 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[531/2067], cost time 1.1877s, every example cost time is 1.1877, generate speed: 6.7356 tokens/s, avg speed: 10.6350 tokens/s, remaining time: 0:35:26 +pred is: + ['Southern and central parts of France'] + label is: + ['the southern and central parts of France'] +The F1/Em of this example is: {'F1': 91.66666666666666, 'Em': 0.0} +2024-07-30 13:58:29,756 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:29,756 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 354, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:29,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:29,757 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:29,757 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:30,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:30,986 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2291843891143799 s; generated tokens: 10 tokens; generate speed: 8.135475920911215 tokens/s +2024-07-30 13:58:30,991 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:30,991 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[532/2067], cost time 1.2403s, every example cost time is 1.2403, generate speed: 8.0627 tokens/s, avg speed: 10.6307 tokens/s, remaining time: 0:35:25 +pred is: + ['A'] + label is: + ['derision'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:31,073 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:31,073 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:31,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:31,074 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:31,074 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:32,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,328 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2541017532348633 s; generated tokens: 11 tokens; generate speed: 8.771218102220422 tokens/s +2024-07-30 13:58:32,333 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:32,333 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[533/2067], cost time 1.2654s, every example cost time is 1.2654, generate speed: 8.6932 tokens/s, avg speed: 10.6273 tokens/s, remaining time: 0:35:23 +pred is: + ['The availability of the Bible in vernacular languages'] + label is: + ['availability of the Bible in vernacular languages'] +The F1/Em of this example is: {'F1': 92.85714285714286, 'Em': 0.0} +2024-07-30 13:58:32,416 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:32,416 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:32,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:32,417 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:32,417 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:33,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:33,950 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5321934223175049 s; generated tokens: 20 tokens; generate speed: 13.053182260598135 tokens/s +2024-07-30 13:58:33,954 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:33,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[534/2067], cost time 1.5434s, every example cost time is 1.5434, generate speed: 12.9586 tokens/s, avg speed: 10.6322 tokens/s, remaining time: 0:35:22 +pred is: + ['66'] + label is: + ['villes de sûreté'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:34,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:34,037 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:34,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:34,038 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:34,038 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:34,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,572 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5339667797088623 s; generated tokens: 20 tokens; generate speed: 13.038092000790186 tokens/s +2024-07-30 13:58:35,577 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:35,577 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[535/2067], cost time 1.5451s, every example cost time is 1.5451, generate speed: 12.9445 tokens/s, avg speed: 10.6370 tokens/s, remaining time: 0:35:21 +pred is: + ['1'] + label is: + ['at the Cape of Good Hope'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:35,659 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:35,660 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 274, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:35,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:35,660 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:35,660 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:36,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:36,928 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.267448902130127 s; generated tokens: 11 tokens; generate speed: 8.678850864530276 tokens/s +2024-07-30 13:58:36,933 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:36,933 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[536/2067], cost time 1.2785s, every example cost time is 1.2785, generate speed: 8.6039 tokens/s, avg speed: 10.6335 tokens/s, remaining time: 0:35:19 +pred is: + ['1624'] + label is: + ['1624'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:37,016 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:37,016 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:37,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:37,017 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:37,017 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:37,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:37,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5577664375305176 s; generated tokens: 20 tokens; generate speed: 12.838895175906746 tokens/s +2024-07-30 13:58:38,580 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:38,580 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[537/2067], cost time 1.5690s, every example cost time is 1.5690, generate speed: 12.7470 tokens/s, avg speed: 10.6380 tokens/s, remaining time: 0:35:19 +pred is: + ['1'] + label is: + ['the Charleston Orange district'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:38,662 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:38,663 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:38,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:38,663 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:38,664 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:39,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:39,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:40,199 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5348351001739502 s; generated tokens: 20 tokens; generate speed: 13.030715806364674 tokens/s +2024-07-30 13:58:40,203 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:40,204 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[538/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9369 tokens/s, avg speed: 10.6427 tokens/s, remaining time: 0:35:18 +pred is: + ['William III of Orange'] + label is: + ['William III of Orange'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:40,286 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:40,287 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:40,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:40,287 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:40,288 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:41,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,482 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.194033145904541 s; generated tokens: 9 tokens; generate speed: 7.537479198855942 tokens/s +2024-07-30 13:58:41,486 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:41,487 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[539/2067], cost time 1.2051s, every example cost time is 1.2051, generate speed: 7.4683 tokens/s, avg speed: 10.6376 tokens/s, remaining time: 0:35:16 +pred is: + ['Edict of Fontainebleau'] + label is: + ['Edict of Fontainebleau'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:41,569 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:41,569 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:41,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:41,570 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:41,570 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:42,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:42,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:43,102 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5317323207855225 s; generated tokens: 20 tokens; generate speed: 13.0571116954321 tokens/s +2024-07-30 13:58:43,107 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:43,107 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[540/2067], cost time 1.5429s, every example cost time is 1.5429, generate speed: 12.9630 tokens/s, avg speed: 10.6424 tokens/s, remaining time: 0:35:15 +pred is: + ['The Catholic Church in France and many of its members opposed the Huguenots.'] + label is: + ['Catholic Church in France'] +The F1/Em of this example is: {'F1': 42.42424242424242, 'Em': 0.0} +F1 score: 64.90115422827083, Em score: 52.407407407407405, current_count: 540 +2024-07-30 13:58:43,325 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:43,325 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:43,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:43,326 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:43,326 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:44,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3960695266723633 s; generated tokens: 15 tokens; generate speed: 10.744450554517602 tokens/s +2024-07-30 13:58:44,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:44,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[541/2067], cost time 1.4073s, every example cost time is 1.4073, generate speed: 10.6589 tokens/s, avg speed: 10.6425 tokens/s, remaining time: 0:35:13 +pred is: + ['1621-1629'] + label is: + ['between 1621 and 1629'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:58:44,809 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:44,810 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:44,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:44,810 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:44,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:45,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:45,914 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1035408973693848 s; generated tokens: 6 tokens; generate speed: 5.437043624121924 tokens/s +2024-07-30 13:58:45,919 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:45,919 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[542/2067], cost time 1.1145s, every example cost time is 1.1145, generate speed: 5.3834 tokens/s, avg speed: 10.6346 tokens/s, remaining time: 0:35:11 +pred is: + ['Approximately one million'] + label is: + ['one million'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:58:46,002 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:46,002 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:46,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:46,003 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:46,003 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:46,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:46,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:47,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:47,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:47,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:47,092 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.088761329650879 s; generated tokens: 5 tokens; generate speed: 4.592374714119663 tokens/s +2024-07-30 13:58:47,097 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:47,097 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[543/2067], cost time 1.0999s, every example cost time is 1.0999, generate speed: 4.5459 tokens/s, avg speed: 10.6257 tokens/s, remaining time: 0:35:09 +pred is: + ['New Rochelle'] + label is: + ['New Rochelle'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:47,178 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:47,179 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:47,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:47,179 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:47,180 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:48,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,251 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0717365741729736 s; generated tokens: 5 tokens; generate speed: 4.665325529137929 tokens/s +2024-07-30 13:58:48,256 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:48,256 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[544/2067], cost time 1.0828s, every example cost time is 1.0828, generate speed: 4.6178 tokens/s, avg speed: 10.6171 tokens/s, remaining time: 0:35:07 +pred is: + ['Dutch Republic'] + label is: + ['the Dutch Republic'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:58:48,339 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:48,339 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:48,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:48,340 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:48,340 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:49,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:49,914 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5738027095794678 s; generated tokens: 20 tokens; generate speed: 12.708073177319763 tokens/s +2024-07-30 13:58:49,919 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:49,919 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[545/2067], cost time 1.5850s, every example cost time is 1.5850, generate speed: 12.6187 tokens/s, avg speed: 10.6213 tokens/s, remaining time: 0:35:06 +pred is: + ['Tours'] + label is: + ['Tours'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:50,001 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:50,001 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:50,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:50,002 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:50,002 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:50,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:50,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531419038772583 s; generated tokens: 20 tokens; generate speed: 13.059782785533214 tokens/s +2024-07-30 13:58:51,538 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:51,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[546/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9652 tokens/s, avg speed: 10.6261 tokens/s, remaining time: 0:35:05 +pred is: + ['Canterbury'] + label is: + ['Canterbury'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:51,621 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:51,621 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:51,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:51,622 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:51,622 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:52,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:52,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:52,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:52,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:52,661 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0387423038482666 s; generated tokens: 4 tokens; generate speed: 3.8508107209854203 tokens/s +2024-07-30 13:58:52,665 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:52,666 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[547/2067], cost time 1.0497s, every example cost time is 1.0497, generate speed: 3.8108 tokens/s, avg speed: 10.6166 tokens/s, remaining time: 0:35:03 +pred is: + ['Cork'] + label is: + ['Cork City'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:58:52,747 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:52,747 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:52,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:52,748 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:52,748 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:53,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:53,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:53,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:53,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:53,788 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.039529800415039 s; generated tokens: 4 tokens; generate speed: 3.8478935364844506 tokens/s +2024-07-30 13:58:53,793 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:53,793 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[548/2067], cost time 1.0505s, every example cost time is 1.0505, generate speed: 3.8079 tokens/s, avg speed: 10.6072 tokens/s, remaining time: 0:35:01 +pred is: + ['Brain drain'] + label is: + ['brain drain'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:53,875 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:53,875 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:53,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:53,876 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:53,876 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:54,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:54,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:54,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:54,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:54,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:54,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:55,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:55,007 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.131368637084961 s; generated tokens: 7 tokens; generate speed: 6.18719643672987 tokens/s +2024-07-30 13:58:55,012 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:55,012 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[549/2067], cost time 1.1423s, every example cost time is 1.1423, generate speed: 6.1278 tokens/s, avg speed: 10.6005 tokens/s, remaining time: 0:34:58 +pred is: + ['Henry of Navarre'] + label is: + ['Henry of Navarre'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:55,094 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:55,094 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:55,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:55,095 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:55,095 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:56,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,187 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0915532112121582 s; generated tokens: 5 tokens; generate speed: 4.580628730364462 tokens/s +2024-07-30 13:58:56,191 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:56,191 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[550/2067], cost time 1.1026s, every example cost time is 1.1026, generate speed: 4.5347 tokens/s, avg speed: 10.5917 tokens/s, remaining time: 0:34:56 +pred is: + ['Education as Catholics'] + label is: + ['education of children as Catholics'] +The F1/Em of this example is: {'F1': 57.14285714285714, 'Em': 0.0} +F1 score: 65.09775661892564, Em score: 52.36363636363637, current_count: 550 +2024-07-30 13:58:56,410 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:56,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 277, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:56,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:56,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:56,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:57,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:57,967 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5557711124420166 s; generated tokens: 20 tokens; generate speed: 12.855361460341678 tokens/s +2024-07-30 13:58:57,972 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:57,972 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[551/2067], cost time 1.5671s, every example cost time is 1.5671, generate speed: 12.7623 tokens/s, avg speed: 10.5961 tokens/s, remaining time: 0:34:55 +pred is: + ['Switzerland and the Netherlands'] + label is: + ['Switzerland and the Netherlands'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:58,055 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:58,055 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 345, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:58,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:58,056 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:58,056 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:58:59,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.230100393295288 s; generated tokens: 10 tokens; generate speed: 8.129417773139009 tokens/s +2024-07-30 13:58:59,291 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:58:59,291 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[552/2067], cost time 1.2412s, every example cost time is 1.2412, generate speed: 8.0565 tokens/s, avg speed: 10.5920 tokens/s, remaining time: 0:34:54 +pred is: + ['Afrikaans'] + label is: + ['Afrikaans'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:58:59,374 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:58:59,374 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:58:59,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:58:59,375 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:58:59,375 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:00,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,633 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2579946517944336 s; generated tokens: 10 tokens; generate speed: 7.949159390889112 tokens/s +2024-07-30 13:59:00,638 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:00,638 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[553/2067], cost time 1.2692s, every example cost time is 1.2692, generate speed: 7.8793 tokens/s, avg speed: 10.5875 tokens/s, remaining time: 0:34:52 +pred is: + ['Paul Revere'] + label is: + ['Paul Revere'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:00,720 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:00,720 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:00,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:00,721 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:00,721 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:01,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:01,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:02,252 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5309364795684814 s; generated tokens: 20 tokens; generate speed: 13.06389929753148 tokens/s +2024-07-30 13:59:02,257 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:02,257 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[554/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9695 tokens/s, avg speed: 10.5923 tokens/s, remaining time: 0:34:51 +pred is: + ['Lace'] + label is: + ['lace'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:02,340 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:02,340 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:02,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:02,341 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:02,341 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:03,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,566 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2248713970184326 s; generated tokens: 10 tokens; generate speed: 8.164122392229814 tokens/s +2024-07-30 13:59:03,571 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:03,571 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[555/2067], cost time 1.2361s, every example cost time is 1.2361, generate speed: 8.0900 tokens/s, avg speed: 10.5882 tokens/s, remaining time: 0:34:49 +pred is: + ['Dorotheenstadt and Friedrichstadt'] + label is: + ['Dorotheenstadt and Friedrichstadt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:03,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:03,654 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:03,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:03,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:03,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:04,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1619994640350342 s; generated tokens: 8 tokens; generate speed: 6.884684758992971 tokens/s +2024-07-30 13:59:04,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:04,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[556/2067], cost time 1.1731s, every example cost time is 1.1731, generate speed: 6.8197 tokens/s, avg speed: 10.5825 tokens/s, remaining time: 0:34:47 +pred is: + ['Prussia'] + label is: + ['Prussia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:04,904 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:04,904 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:04,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:04,905 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:04,905 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:05,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:05,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:05,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:05,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:05,943 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0376935005187988 s; generated tokens: 4 tokens; generate speed: 3.8547027595337013 tokens/s +2024-07-30 13:59:05,948 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:05,948 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[557/2067], cost time 1.0485s, every example cost time is 1.0485, generate speed: 3.8150 tokens/s, avg speed: 10.5733 tokens/s, remaining time: 0:34:45 +pred is: + ['Jacksonville'] + label is: + ['Jacksonville'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:06,030 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:06,030 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:06,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:06,059 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:06,059 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:07,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2266473770141602 s; generated tokens: 10 tokens; generate speed: 8.152302110115352 tokens/s +2024-07-30 13:59:07,291 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:07,291 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[558/2067], cost time 1.2656s, every example cost time is 1.2656, generate speed: 7.9014 tokens/s, avg speed: 10.5689 tokens/s, remaining time: 0:34:43 +pred is: + ['Charlesfort'] + label is: + ['Charlesfort'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:07,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:07,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 304, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:07,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:07,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:07,374 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:08,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,621 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.246600866317749 s; generated tokens: 10 tokens; generate speed: 8.021813773913323 tokens/s +2024-07-30 13:59:08,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:08,626 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[559/2067], cost time 1.2578s, every example cost time is 1.2578, generate speed: 7.9505 tokens/s, avg speed: 10.5646 tokens/s, remaining time: 0:34:42 +pred is: + ['Virginia'] + label is: + ['Virginia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:08,708 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:08,709 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 316, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:08,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:08,709 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:08,709 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:09,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:09,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:10,061 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.351513147354126 s; generated tokens: 14 tokens; generate speed: 10.3587597556176 tokens/s +2024-07-30 13:59:10,066 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:10,066 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[560/2067], cost time 1.3627s, every example cost time is 1.3627, generate speed: 10.2740 tokens/s, avg speed: 10.5641 tokens/s, remaining time: 0:34:40 +pred is: + ['1568–1609'] + label is: + ['1568–1609'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 65.72101096501626, Em score: 53.214285714285715, current_count: 560 +2024-07-30 13:59:10,288 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:10,288 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:10,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:10,289 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:10,289 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:11,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,816 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5270426273345947 s; generated tokens: 20 tokens; generate speed: 13.097211329921665 tokens/s +2024-07-30 13:59:11,821 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:11,821 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[561/2067], cost time 1.5384s, every example cost time is 1.5384, generate speed: 13.0008 tokens/s, avg speed: 10.5689 tokens/s, remaining time: 0:34:39 +pred is: + ['Foreign Protestants Naturalization Act'] + label is: + ['Foreign Protestants Naturalization Act'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:11,904 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:11,904 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:11,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:11,905 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:11,905 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:12,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:12,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:12,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:12,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:12,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,433 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527482509613037 s; generated tokens: 20 tokens; generate speed: 13.09343961330639 tokens/s +2024-07-30 13:59:13,438 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:13,438 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[562/2067], cost time 1.5386s, every example cost time is 1.5386, generate speed: 12.9990 tokens/s, avg speed: 10.5738 tokens/s, remaining time: 0:34:38 +pred is: + ['Williamite war in Ireland'] + label is: + ['Williamite war'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 13:59:13,520 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:13,521 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:13,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:13,521 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:13,522 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:14,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:14,961 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.43906569480896 s; generated tokens: 17 tokens; generate speed: 11.813220245137453 tokens/s +2024-07-30 13:59:14,966 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:14,966 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[563/2067], cost time 1.4502s, every example cost time is 1.4502, generate speed: 11.7226 tokens/s, avg speed: 10.5759 tokens/s, remaining time: 0:34:37 +pred is: + ['Count Ludwig von Nassau-Saarbrücken'] + label is: + ['Prince Louis de Condé'] +The F1/Em of this example is: {'F1': 11.76470588235294, 'Em': 0.0} +2024-07-30 13:59:15,049 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:15,050 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:15,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:15,050 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:15,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:15,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,579 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528817892074585 s; generated tokens: 20 tokens; generate speed: 13.082002836099905 tokens/s +2024-07-30 13:59:16,584 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:16,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[564/2067], cost time 1.5400s, every example cost time is 1.5400, generate speed: 12.9870 tokens/s, avg speed: 10.5807 tokens/s, remaining time: 0:34:36 +pred is: + ['Electorate of Brandenburg and Electorate of the Palatinate'] + label is: + ['Electorate of Brandenburg and Electorate of the Palatinate'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:16,668 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:16,668 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:16,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:16,669 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:16,669 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:17,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,800 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.131425380706787 s; generated tokens: 7 tokens; generate speed: 6.186886134397294 tokens/s +2024-07-30 13:59:17,805 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:17,805 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[565/2067], cost time 1.1425s, every example cost time is 1.1425, generate speed: 6.1271 tokens/s, avg speed: 10.5741 tokens/s, remaining time: 0:34:34 +pred is: + ['Hugues Capet'] + label is: + ['Hugues Capet'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:17,888 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:17,888 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 321, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:17,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:17,889 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:17,889 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:18,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:18,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:18,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:18,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:18,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:18,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,427 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5381808280944824 s; generated tokens: 20 tokens; generate speed: 13.002372435480327 tokens/s +2024-07-30 13:59:19,432 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:19,432 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[566/2067], cost time 1.5494s, every example cost time is 1.5494, generate speed: 12.9081 tokens/s, avg speed: 10.5788 tokens/s, remaining time: 0:34:33 +pred is: + ['Jacques Lefevre'] + label is: + ['Jacques Lefevre'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:19,521 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:19,521 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:19,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:19,522 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:19,522 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:20,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:20,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:21,057 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534346580505371 s; generated tokens: 20 tokens; generate speed: 13.034864647994038 tokens/s +2024-07-30 13:59:21,062 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:21,062 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[567/2067], cost time 1.5511s, every example cost time is 1.5511, generate speed: 12.8943 tokens/s, avg speed: 10.5834 tokens/s, remaining time: 0:34:32 +pred is: + ['1572'] + label is: + ['24 August – 3 October 1572'] +The F1/Em of this example is: {'F1': 16.666666666666668, 'Em': 0.0} +2024-07-30 13:59:21,144 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:21,145 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:21,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:21,145 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:21,145 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:22,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:22,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:22,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:22,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:22,185 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.039381742477417 s; generated tokens: 4 tokens; generate speed: 3.8484416615456465 tokens/s +2024-07-30 13:59:22,190 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:22,190 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[568/2067], cost time 1.0505s, every example cost time is 1.0505, generate speed: 3.8077 tokens/s, avg speed: 10.5743 tokens/s, remaining time: 0:34:30 +pred is: + ['Louis XIV'] + label is: + ['Louis XIV'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:22,279 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:22,280 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 366, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:22,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:22,280 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:22,281 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:23,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,754 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4731099605560303 s; generated tokens: 18 tokens; generate speed: 12.219047105761094 tokens/s +2024-07-30 13:59:23,759 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:23,759 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[569/2067], cost time 1.4847s, every example cost time is 1.4847, generate speed: 12.1233 tokens/s, avg speed: 10.5772 tokens/s, remaining time: 0:34:29 +pred is: + ['Westchester'] + label is: + ['Westchester'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:23,841 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:23,842 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:23,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:23,842 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:23,842 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:24,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:24,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:25,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:25,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:25,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:25,378 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353922843933105 s; generated tokens: 20 tokens; generate speed: 13.02598704141771 tokens/s +2024-07-30 13:59:25,383 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:25,383 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[570/2067], cost time 1.5465s, every example cost time is 1.5465, generate speed: 12.9321 tokens/s, avg speed: 10.5818 tokens/s, remaining time: 0:34:28 +pred is: + ['They adapted quickly and often married outside their immediate French communities, which led to their assimilation.'] + label is: + ['affiliated with other Protestant denominations'] +The F1/Em of this example is: {'F1': 4.761904761904762, 'Em': 0.0} +F1 score: 65.7841393293334, Em score: 53.333333333333336, current_count: 570 +2024-07-30 13:59:25,610 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:25,610 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:25,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:25,611 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:25,611 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:26,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:26,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:27,138 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5266976356506348 s; generated tokens: 20 tokens; generate speed: 13.100170939530258 tokens/s +2024-07-30 13:59:27,143 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:27,143 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[571/2067], cost time 1.5379s, every example cost time is 1.5379, generate speed: 13.0044 tokens/s, avg speed: 10.5866 tokens/s, remaining time: 0:34:27 +pred is: + ['Pierre Bayle'] + label is: + ['Pierre Bayle'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:27,225 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:27,226 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:27,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:27,226 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:27,226 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:28,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,757 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530458688735962 s; generated tokens: 20 tokens; generate speed: 13.067977690086115 tokens/s +2024-07-30 13:59:28,762 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:28,762 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[572/2067], cost time 1.5416s, every example cost time is 1.5416, generate speed: 12.9736 tokens/s, avg speed: 10.5912 tokens/s, remaining time: 0:34:26 +pred is: + ['The French Protestant Church of London'] + label is: + ['The French Protestant Church of London'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:28,845 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:28,845 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 349, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:28,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:28,846 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:28,846 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:29,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:29,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:30,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:30,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:30,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:30,387 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5408132076263428 s; generated tokens: 20 tokens; generate speed: 12.98015872463246 tokens/s +2024-07-30 13:59:30,392 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:30,392 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[573/2067], cost time 1.5520s, every example cost time is 1.5520, generate speed: 12.8866 tokens/s, avg speed: 10.5957 tokens/s, remaining time: 0:34:25 +pred is: + ['Lutheran and Reformed'] + label is: + ['Lutheran and Reformed'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:30,475 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:30,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:30,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:30,476 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:30,476 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:31,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,587 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.110311508178711 s; generated tokens: 6 tokens; generate speed: 5.4038888688473055 tokens/s +2024-07-30 13:59:31,591 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:31,592 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[574/2067], cost time 1.1217s, every example cost time is 1.1217, generate speed: 5.3488 tokens/s, avg speed: 10.5883 tokens/s, remaining time: 0:34:23 +pred is: + ['Frederick William'] + label is: + ['Frederick William'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:31,674 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:31,674 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:31,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:31,675 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:31,675 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:32,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:32,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:33,207 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531446933746338 s; generated tokens: 20 tokens; generate speed: 13.059544904422207 tokens/s +2024-07-30 13:59:33,212 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:33,212 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[575/2067], cost time 1.5428s, every example cost time is 1.5428, generate speed: 12.9637 tokens/s, avg speed: 10.5929 tokens/s, remaining time: 0:34:22 +pred is: + ['solar power'] + label is: + ['solar'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:59:33,294 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:33,294 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:33,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:33,295 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:33,295 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:34,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,398 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1020851135253906 s; generated tokens: 6 tokens; generate speed: 5.444225610494799 tokens/s +2024-07-30 13:59:34,402 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:34,403 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[576/2067], cost time 1.1133s, every example cost time is 1.1133, generate speed: 5.3894 tokens/s, avg speed: 10.5856 tokens/s, remaining time: 0:34:20 +pred is: + ['atmospheric engine'] + label is: + ['atmospheric engine'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:34,493 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:34,494 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:34,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:34,495 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:34,495 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:35,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:35,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:35,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:35,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:35,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.039308786392212 s; generated tokens: 4 tokens; generate speed: 3.848711809591581 tokens/s +2024-07-30 13:59:35,539 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:35,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[577/2067], cost time 1.0508s, every example cost time is 1.0508, generate speed: 3.8066 tokens/s, avg speed: 10.5767 tokens/s, remaining time: 0:34:18 +pred is: + ['United Kingdom'] + label is: + ['United Kingdom'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:35,621 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:35,622 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:35,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:35,622 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:35,622 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:36,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:36,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:36,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:36,633 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0099010467529297 s; generated tokens: 3 tokens; generate speed: 2.970588068648615 tokens/s +2024-07-30 13:59:36,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:36,638 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[578/2067], cost time 1.0211s, every example cost time is 1.0211, generate speed: 2.9381 tokens/s, avg speed: 10.5669 tokens/s, remaining time: 0:34:15 +pred is: + ['Injector'] + label is: + ['water pump'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:36,720 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:36,720 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 294, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:36,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:36,721 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:36,721 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:37,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:37,957 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2358946800231934 s; generated tokens: 10 tokens; generate speed: 8.09130434950358 tokens/s +2024-07-30 13:59:37,962 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:37,962 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[579/2067], cost time 1.2471s, every example cost time is 1.2471, generate speed: 8.0186 tokens/s, avg speed: 10.5629 tokens/s, remaining time: 0:34:14 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:38,044 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:38,045 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:38,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:38,045 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:38,045 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:38,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,596 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5507311820983887 s; generated tokens: 20 tokens; generate speed: 12.897141832755812 tokens/s +2024-07-30 13:59:39,601 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:39,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[580/2067], cost time 1.5620s, every example cost time is 1.5620, generate speed: 12.8043 tokens/s, avg speed: 10.5673 tokens/s, remaining time: 0:34:13 +pred is: + ['1'] + label is: + ['Corliss'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.7706196857242, Em score: 53.44827586206897, current_count: 580 +2024-07-30 13:59:39,830 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:39,830 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:39,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:39,831 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:39,831 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:40,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:40,932 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1011486053466797 s; generated tokens: 6 tokens; generate speed: 5.448855831871114 tokens/s +2024-07-30 13:59:40,937 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:40,937 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[581/2067], cost time 1.1125s, every example cost time is 1.1125, generate speed: 5.3935 tokens/s, avg speed: 10.5601 tokens/s, remaining time: 0:34:11 +pred is: + ['Lead fusible plugs'] + label is: + ['Lead fusible plugs'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:41,020 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:41,021 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:41,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:41,021 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:41,021 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:41,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:41,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:42,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:42,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:42,068 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0466411113739014 s; generated tokens: 4 tokens; generate speed: 3.821749362347609 tokens/s +2024-07-30 13:59:42,073 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:42,073 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[582/2067], cost time 1.0579s, every example cost time is 1.0579, generate speed: 3.7812 tokens/s, avg speed: 10.5512 tokens/s, remaining time: 0:34:08 +pred is: + ['James Watt'] + label is: + ['James Watt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:42,155 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:42,155 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:42,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:42,156 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:42,156 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:43,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,686 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530158519744873 s; generated tokens: 20 tokens; generate speed: 13.070541216432039 tokens/s +2024-07-30 13:59:43,691 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:43,692 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[583/2067], cost time 1.5414s, every example cost time is 1.5414, generate speed: 12.9752 tokens/s, avg speed: 10.5558 tokens/s, remaining time: 0:34:08 +pred is: + ['1'] + label is: + ['first'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:43,773 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:43,773 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:43,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:43,774 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:43,774 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:44,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:44,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:44,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:44,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:44,814 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0391356945037842 s; generated tokens: 4 tokens; generate speed: 3.849352900835641 tokens/s +2024-07-30 13:59:44,818 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:44,819 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[584/2067], cost time 1.0502s, every example cost time is 1.0502, generate speed: 3.8086 tokens/s, avg speed: 10.5470 tokens/s, remaining time: 0:34:05 +pred is: + ['Compound engines'] + label is: + ['compound'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:59:44,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:44,901 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:44,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:44,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:44,901 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:45,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:45,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:45,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:45,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:45,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,128 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.226593255996704 s; generated tokens: 10 tokens; generate speed: 8.15266181442862 tokens/s +2024-07-30 13:59:46,133 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:46,133 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[585/2067], cost time 1.2378s, every example cost time is 1.2378, generate speed: 8.0791 tokens/s, avg speed: 10.5433 tokens/s, remaining time: 0:34:04 +pred is: + ['steam turbines'] + label is: + ['steam turbines'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:46,216 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:46,216 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:46,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:46,217 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:46,217 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:47,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,317 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0998985767364502 s; generated tokens: 6 tokens; generate speed: 5.455048426194733 tokens/s +2024-07-30 13:59:47,322 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:47,322 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[586/2067], cost time 1.1111s, every example cost time is 1.1111, generate speed: 5.4003 tokens/s, avg speed: 10.5362 tokens/s, remaining time: 0:34:02 +pred is: + ['Combustible materials'] + label is: + ['burning combustible materials'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 13:59:47,409 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:47,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:47,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:47,410 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:47,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:48,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:48,940 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297036170959473 s; generated tokens: 20 tokens; generate speed: 13.074428128743547 tokens/s +2024-07-30 13:59:48,945 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:48,946 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[587/2067], cost time 1.5413s, every example cost time is 1.5413, generate speed: 12.9761 tokens/s, avg speed: 10.5408 tokens/s, remaining time: 0:34:01 +pred is: + ['1'] + label is: + ['steam engine indicator'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:49,029 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:49,029 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:49,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:49,030 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:49,030 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:49,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:50,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:50,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:50,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:50,072 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0419399738311768 s; generated tokens: 4 tokens; generate speed: 3.838992744747224 tokens/s +2024-07-30 13:59:50,077 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:50,078 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[588/2067], cost time 1.0531s, every example cost time is 1.0531, generate speed: 3.7982 tokens/s, avg speed: 10.5321 tokens/s, remaining time: 0:33:58 +pred is: + ['90°'] + label is: + ['90'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 13:59:50,160 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:50,160 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:50,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:50,161 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:50,161 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:51,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:51,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:51,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:51,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:51,200 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0383517742156982 s; generated tokens: 4 tokens; generate speed: 3.852259031407091 tokens/s +2024-07-30 13:59:51,204 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:51,205 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[589/2067], cost time 1.0494s, every example cost time is 1.0494, generate speed: 3.8118 tokens/s, avg speed: 10.5234 tokens/s, remaining time: 0:33:56 +pred is: + ['Counterflow'] + label is: + ['counterflow'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:51,287 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:51,287 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:51,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:51,287 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:51,288 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:52,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,573 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2853314876556396 s; generated tokens: 12 tokens; generate speed: 9.336112991277615 tokens/s +2024-07-30 13:59:52,578 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:52,578 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[590/2067], cost time 1.2964s, every example cost time is 1.2964, generate speed: 9.2563 tokens/s, avg speed: 10.5214 tokens/s, remaining time: 0:33:55 +pred is: + ['Uniflow engine'] + label is: + ['Quasiturbine'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.65868827862154, Em score: 53.220338983050844, current_count: 590 +2024-07-30 13:59:52,809 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:52,809 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:52,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:52,810 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:52,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:53,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:53,915 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1044600009918213 s; generated tokens: 6 tokens; generate speed: 5.432519054209217 tokens/s +2024-07-30 13:59:53,920 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:53,920 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[591/2067], cost time 1.1160s, every example cost time is 1.1160, generate speed: 5.3762 tokens/s, avg speed: 10.5143 tokens/s, remaining time: 0:33:53 +pred is: + ['Oscillating'] + label is: + ['oscillating cylinder'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 13:59:54,004 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:54,004 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:54,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:54,005 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:54,005 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:54,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:54,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,105 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0998718738555908 s; generated tokens: 6 tokens; generate speed: 5.455180864810239 tokens/s +2024-07-30 13:59:55,110 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:55,110 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[592/2067], cost time 1.1117s, every example cost time is 1.1117, generate speed: 5.3972 tokens/s, avg speed: 10.5073 tokens/s, remaining time: 0:33:50 +pred is: + ['It is recycled continuously'] + label is: + ['recycled continuously'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 13:59:55,192 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:55,193 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:55,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:55,193 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:55,193 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:56,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,326 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.132885456085205 s; generated tokens: 7 tokens; generate speed: 6.17891240672219 tokens/s +2024-07-30 13:59:56,331 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:56,332 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[593/2067], cost time 1.1439s, every example cost time is 1.1439, generate speed: 6.1192 tokens/s, avg speed: 10.5012 tokens/s, remaining time: 0:33:49 +pred is: + ['1'] + label is: + ['working fluid'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:56,414 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:56,414 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:56,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:56,415 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:56,415 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:57,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:57,941 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5258350372314453 s; generated tokens: 20 tokens; generate speed: 13.10757684283423 tokens/s +2024-07-30 13:59:57,946 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:57,946 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[594/2067], cost time 1.5369s, every example cost time is 1.5369, generate speed: 13.0128 tokens/s, avg speed: 10.5059 tokens/s, remaining time: 0:33:48 +pred is: + ['1'] + label is: + ['Steam engines'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 13:59:58,028 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:58,029 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:58,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:58,029 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:58,030 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 13:59:58,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,254 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2242474555969238 s; generated tokens: 10 tokens; generate speed: 8.16828326191959 tokens/s +2024-07-30 13:59:59,260 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 13:59:59,260 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[595/2067], cost time 1.2367s, every example cost time is 1.2367, generate speed: 8.0861 tokens/s, avg speed: 10.5022 tokens/s, remaining time: 0:33:46 +pred is: + ['Catch Me Who Can'] + label is: + ['Catch Me Who Can'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 13:59:59,342 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 13:59:59,343 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 13:59:59,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 13:59:59,343 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 13:59:59,344 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:00,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:00,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:00,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:00,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:00,385 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.041431188583374 s; generated tokens: 4 tokens; generate speed: 3.8408682626848094 tokens/s +2024-07-30 14:00:00,390 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:00,390 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[596/2067], cost time 1.0526s, every example cost time is 1.0526, generate speed: 3.8000 tokens/s, avg speed: 10.4936 tokens/s, remaining time: 0:33:44 +pred is: + ['Arthur Woolf'] + label is: + ['Arthur Woolf'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:00,473 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:00,473 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:00,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:00,474 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:00,474 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:01,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:01,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:02,008 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5336401462554932 s; generated tokens: 20 tokens; generate speed: 13.040868843210465 tokens/s +2024-07-30 14:00:02,013 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:02,013 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[597/2067], cost time 1.5450s, every example cost time is 1.5450, generate speed: 12.9452 tokens/s, avg speed: 10.4983 tokens/s, remaining time: 0:33:43 +pred is: + ['90'] + label is: + ['90'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:02,096 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:02,096 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:02,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:02,097 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:02,097 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:03,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,202 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1048061847686768 s; generated tokens: 6 tokens; generate speed: 5.4308168099695004 tokens/s +2024-07-30 14:00:03,207 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:03,207 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[598/2067], cost time 1.1159s, every example cost time is 1.1159, generate speed: 5.3769 tokens/s, avg speed: 10.4913 tokens/s, remaining time: 0:33:41 +pred is: + ['The Rankine cycle'] + label is: + ['Rankine cycle'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:00:03,289 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:03,289 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:03,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:03,290 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:03,290 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:04,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,820 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297868251800537 s; generated tokens: 20 tokens; generate speed: 13.07371698514009 tokens/s +2024-07-30 14:00:04,824 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:04,825 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[599/2067], cost time 1.5408s, every example cost time is 1.5408, generate speed: 12.9802 tokens/s, avg speed: 10.4960 tokens/s, remaining time: 0:33:40 +pred is: + ['By the amount of work it could do'] + label is: + ['duty'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:04,907 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:04,907 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:04,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:04,907 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:04,908 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:05,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:05,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:05,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:05,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:05,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:06,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:06,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:06,040 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1323473453521729 s; generated tokens: 7 tokens; generate speed: 6.181848731073698 tokens/s +2024-07-30 14:00:06,045 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:06,045 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[600/2067], cost time 1.1434s, every example cost time is 1.1434, generate speed: 6.1220 tokens/s, avg speed: 10.4899 tokens/s, remaining time: 0:33:38 +pred is: + ['Turbine steam engines'] + label is: + ['steam turbines'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 65.45604347397784, Em score: 52.833333333333336, current_count: 600 +2024-07-30 14:00:06,279 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:06,279 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:06,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:06,280 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:06,280 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:07,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,537 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.25687575340271 s; generated tokens: 11 tokens; generate speed: 8.751859497822247 tokens/s +2024-07-30 14:00:07,542 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:07,542 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[601/2067], cost time 1.2685s, every example cost time is 1.2685, generate speed: 8.6720 tokens/s, avg speed: 10.4871 tokens/s, remaining time: 0:33:36 +pred is: + ['Thomas Savery'] + label is: + ['Thomas Savery'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:07,624 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:07,624 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:07,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:07,625 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:07,625 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:08,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:08,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:09,006 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3803160190582275 s; generated tokens: 15 tokens; generate speed: 10.86707666425136 tokens/s +2024-07-30 14:00:09,010 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:09,011 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[602/2067], cost time 1.3915s, every example cost time is 1.3915, generate speed: 10.7799 tokens/s, avg speed: 10.4876 tokens/s, remaining time: 0:33:35 +pred is: + ['1'] + label is: + ['Richard Trevithick'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:09,093 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:09,093 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:09,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:09,094 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:09,094 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:10,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,228 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1340751647949219 s; generated tokens: 7 tokens; generate speed: 6.172430379661678 tokens/s +2024-07-30 14:00:10,233 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:10,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[603/2067], cost time 1.1452s, every example cost time is 1.1452, generate speed: 6.1126 tokens/s, avg speed: 10.4816 tokens/s, remaining time: 0:33:33 +pred is: + ['Energiprojekt AB'] + label is: + ['Energiprojekt AB'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:10,315 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:10,315 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 283, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:10,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:10,316 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:10,316 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:11,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,854 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.537248134613037 s; generated tokens: 20 tokens; generate speed: 13.010261355779422 tokens/s +2024-07-30 14:00:11,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:11,859 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[604/2067], cost time 1.5486s, every example cost time is 1.5486, generate speed: 12.9152 tokens/s, avg speed: 10.4861 tokens/s, remaining time: 0:33:32 +pred is: + ['1'] + label is: + ['surface condensers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:11,941 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:11,942 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:11,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:11,942 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:11,943 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:12,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:12,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:12,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:12,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,473 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297291278839111 s; generated tokens: 20 tokens; generate speed: 13.074210090819275 tokens/s +2024-07-30 14:00:13,477 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:13,478 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[605/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9792 tokens/s, avg speed: 10.4907 tokens/s, remaining time: 0:33:31 +pred is: + ['1'] + label is: + ['centrifugal governor'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:13,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:13,561 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:13,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:13,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:13,562 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:14,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:14,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:15,088 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5266807079315186 s; generated tokens: 20 tokens; generate speed: 13.100316193225341 tokens/s +2024-07-30 14:00:15,093 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:15,093 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[606/2067], cost time 1.5379s, every example cost time is 1.5379, generate speed: 13.0047 tokens/s, avg speed: 10.4953 tokens/s, remaining time: 0:33:30 +pred is: + ['1880'] + label is: + ['1880'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:15,176 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:15,177 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:15,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:15,177 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:15,177 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:16,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,281 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.103515625 s; generated tokens: 6 tokens; generate speed: 5.43716814159292 tokens/s +2024-07-30 14:00:16,286 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:16,286 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[607/2067], cost time 1.1146s, every example cost time is 1.1146, generate speed: 5.3831 tokens/s, avg speed: 10.4885 tokens/s, remaining time: 0:33:28 +pred is: + ['Shortening the cutoff'] + label is: + ['shortening the cutoff'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:16,369 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:16,369 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:16,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:16,370 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:16,370 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:17,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:17,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:17,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:17,380 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0098707675933838 s; generated tokens: 3 tokens; generate speed: 2.9706771363916986 tokens/s +2024-07-30 14:00:17,385 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:17,385 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[608/2067], cost time 1.0209s, every example cost time is 1.0209, generate speed: 2.9387 tokens/s, avg speed: 10.4793 tokens/s, remaining time: 0:33:26 +pred is: + ['1'] + label is: + ['Jerónimo de Ayanz y Beaumont'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:17,467 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:17,467 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 352, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:17,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:17,468 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:17,468 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:18,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:18,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:18,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:18,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:18,513 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.044480323791504 s; generated tokens: 4 tokens; generate speed: 3.8296556755419244 tokens/s +2024-07-30 14:00:18,518 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:18,518 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[609/2067], cost time 1.0555s, every example cost time is 1.0555, generate speed: 3.7898 tokens/s, avg speed: 10.4709 tokens/s, remaining time: 0:33:24 +pred is: + ['Blades'] + label is: + ['rotating discs'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:18,600 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:18,600 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:18,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:18,601 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:18,601 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:19,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:19,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:20,156 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5544750690460205 s; generated tokens: 20 tokens; generate speed: 12.866079616364626 tokens/s +2024-07-30 14:00:20,160 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:20,161 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[610/2067], cost time 1.5656s, every example cost time is 1.5656, generate speed: 12.7743 tokens/s, avg speed: 10.4752 tokens/s, remaining time: 0:33:23 +pred is: + ['1'] + label is: + ['lower'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 65.03873128587985, Em score: 52.622950819672134, current_count: 610 +2024-07-30 14:00:20,396 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:20,396 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:20,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:20,397 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:20,397 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:21,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,502 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1044917106628418 s; generated tokens: 6 tokens; generate speed: 5.432363087993846 tokens/s +2024-07-30 14:00:21,507 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:21,507 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[611/2067], cost time 1.1160s, every example cost time is 1.1160, generate speed: 5.3763 tokens/s, avg speed: 10.4684 tokens/s, remaining time: 0:33:21 +pred is: + ['Wankel engine'] + label is: + ['Wankel'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:00:21,588 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:21,589 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:21,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:21,589 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:21,590 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:22,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:22,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:23,120 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530181646347046 s; generated tokens: 20 tokens; generate speed: 13.070343673083105 tokens/s +2024-07-30 14:00:23,125 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:23,125 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[612/2067], cost time 1.5414s, every example cost time is 1.5414, generate speed: 12.9755 tokens/s, avg speed: 10.4730 tokens/s, remaining time: 0:33:20 +pred is: + ['1763-1775'] + label is: + ['1775'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:23,207 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:23,207 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:23,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:23,208 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:23,208 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:24,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:24,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:24,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:24,217 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0088729858398438 s; generated tokens: 3 tokens; generate speed: 2.9736151548379777 tokens/s +2024-07-30 14:00:24,222 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:24,222 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[613/2067], cost time 1.0197s, every example cost time is 1.0197, generate speed: 2.9420 tokens/s, avg speed: 10.4639 tokens/s, remaining time: 0:33:17 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:24,331 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:24,332 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:24,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:24,332 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:24,333 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:25,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,495 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1623399257659912 s; generated tokens: 8 tokens; generate speed: 6.882668161577549 tokens/s +2024-07-30 14:00:25,500 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:25,500 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[614/2067], cost time 1.1738s, every example cost time is 1.1738, generate speed: 6.8153 tokens/s, avg speed: 10.4588 tokens/s, remaining time: 0:33:16 +pred is: + ['The Corliss steam engine'] + label is: + ['Corliss steam engine'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:00:25,582 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:25,582 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:25,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:25,583 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:25,583 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:26,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,654 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0705275535583496 s; generated tokens: 5 tokens; generate speed: 4.670594403086957 tokens/s +2024-07-30 14:00:26,658 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:26,659 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[615/2067], cost time 1.0814s, every example cost time is 1.0814, generate speed: 4.6236 tokens/s, avg speed: 10.4513 tokens/s, remaining time: 0:33:14 +pred is: + ['Thermodynamics'] + label is: + ['thermodynamic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:26,740 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:26,740 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:26,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:26,741 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:26,741 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:27,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:27,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:28,272 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5305180549621582 s; generated tokens: 20 tokens; generate speed: 13.067470805167664 tokens/s +2024-07-30 14:00:28,277 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:28,277 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[616/2067], cost time 1.5417s, every example cost time is 1.5417, generate speed: 12.9731 tokens/s, avg speed: 10.4559 tokens/s, remaining time: 0:33:13 +pred is: + ['1'] + label is: + ['during the compression stage relatively little work is required to drive the pump'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:28,360 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:28,360 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:28,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:28,361 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:28,361 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:29,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:29,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:29,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:29,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0088567733764648 s; generated tokens: 3 tokens; generate speed: 2.9736629412315203 tokens/s +2024-07-30 14:00:29,375 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:29,375 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[617/2067], cost time 1.0201s, every example cost time is 1.0201, generate speed: 2.9409 tokens/s, avg speed: 10.4469 tokens/s, remaining time: 0:33:10 +pred is: + ['Injector'] + label is: + ['injector'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:29,488 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:29,489 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:29,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:29,490 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:29,490 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:30,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:30,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:31,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337028503417969 s; generated tokens: 20 tokens; generate speed: 13.040335678806917 tokens/s +2024-07-30 14:00:31,028 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:31,029 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[618/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9417 tokens/s, avg speed: 10.4514 tokens/s, remaining time: 0:33:09 +pred is: + ['1'] + label is: + ['feed water'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:31,111 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:31,111 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:31,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:31,112 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:31,112 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:32,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,597 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4851832389831543 s; generated tokens: 18 tokens; generate speed: 12.119716629931727 tokens/s +2024-07-30 14:00:32,602 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:32,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[619/2067], cost time 1.4964s, every example cost time is 1.4964, generate speed: 12.0291 tokens/s, avg speed: 10.4542 tokens/s, remaining time: 0:33:08 +pred is: + ['1'] + label is: + ['water'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:32,684 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:32,684 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:32,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:32,685 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:32,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:33,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:33,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:34,216 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310964584350586 s; generated tokens: 20 tokens; generate speed: 13.062534296788918 tokens/s +2024-07-30 14:00:34,221 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:34,221 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[620/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9681 tokens/s, avg speed: 10.4587 tokens/s, remaining time: 0:33:07 +pred is: + ['A practical Carnot cycle'] + label is: + ['practical Carnot cycle'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +F1 score: 64.50047217911833, Em score: 51.935483870967744, current_count: 620 +2024-07-30 14:00:34,491 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:34,491 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:34,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:34,492 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:34,492 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:35,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:35,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:35,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:35,501 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.008871078491211 s; generated tokens: 3 tokens; generate speed: 2.9736207766869147 tokens/s +2024-07-30 14:00:35,506 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:35,506 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[621/2067], cost time 1.0204s, every example cost time is 1.0204, generate speed: 2.9399 tokens/s, avg speed: 10.4497 tokens/s, remaining time: 0:33:05 +pred is: + ['8'] + label is: + ['8'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:35,588 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:35,588 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 248, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:35,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:35,589 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:35,589 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:36,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:36,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:36,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:36,599 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0099384784698486 s; generated tokens: 3 tokens; generate speed: 2.97047796866328 tokens/s +2024-07-30 14:00:36,604 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:36,604 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[622/2067], cost time 1.0210s, every example cost time is 1.0210, generate speed: 2.9383 tokens/s, avg speed: 10.4408 tokens/s, remaining time: 0:33:03 +pred is: + ['1'] + label is: + ['photosynthesis'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:36,685 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:36,686 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:36,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:36,686 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:36,686 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:37,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:37,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:37,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:37,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:37,725 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.038194179534912 s; generated tokens: 4 tokens; generate speed: 3.8528437924704133 tokens/s +2024-07-30 14:00:37,729 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:37,730 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[623/2067], cost time 1.0491s, every example cost time is 1.0491, generate speed: 3.8129 tokens/s, avg speed: 10.4326 tokens/s, remaining time: 0:33:01 +pred is: + ['Robert Boyle'] + label is: + ['Robert Boyle'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:37,812 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:37,812 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:37,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:37,813 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:37,813 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:38,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:38,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:39,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:39,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:39,344 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531238317489624 s; generated tokens: 20 tokens; generate speed: 13.061324139790882 tokens/s +2024-07-30 14:00:39,349 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:39,350 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[624/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9658 tokens/s, avg speed: 10.4372 tokens/s, remaining time: 0:33:00 +pred is: + ['1'] + label is: + ['Joseph Priestley'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:39,432 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:39,432 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:39,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:39,433 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:39,433 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:40,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:40,964 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5309617519378662 s; generated tokens: 20 tokens; generate speed: 13.06368364505797 tokens/s +2024-07-30 14:00:40,969 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:40,969 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[625/2067], cost time 1.5423s, every example cost time is 1.5423, generate speed: 12.9674 tokens/s, avg speed: 10.4417 tokens/s, remaining time: 0:32:59 +pred is: + ['Leonardo da Vinci'] + label is: + ['Leonardo da Vinci'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:41,052 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:41,052 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:41,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:41,053 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:41,053 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:41,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,185 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.131279706954956 s; generated tokens: 7 tokens; generate speed: 6.187682813511935 tokens/s +2024-07-30 14:00:42,189 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:42,190 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[626/2067], cost time 1.1423s, every example cost time is 1.1423, generate speed: 6.1278 tokens/s, avg speed: 10.4360 tokens/s, remaining time: 0:32:57 +pred is: + ['An ignition event'] + label is: + ['heat or a spark'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 14:00:42,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:42,272 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:42,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:42,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:42,273 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:43,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,583 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3105013370513916 s; generated tokens: 12 tokens; generate speed: 9.156801035395981 tokens/s +2024-07-30 14:00:43,588 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:43,588 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[627/2067], cost time 1.3216s, every example cost time is 1.3216, generate speed: 9.0801 tokens/s, avg speed: 10.4339 tokens/s, remaining time: 0:32:55 +pred is: + ['1'] + label is: + ['pure O'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:43,670 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:43,670 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:43,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:43,671 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:43,671 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:44,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,803 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.131819725036621 s; generated tokens: 7 tokens; generate speed: 6.184730523028752 tokens/s +2024-07-30 14:00:44,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:44,808 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[628/2067], cost time 1.1430s, every example cost time is 1.1430, generate speed: 6.1241 tokens/s, avg speed: 10.4282 tokens/s, remaining time: 0:32:54 +pred is: + ['Silica SiO2'] + label is: + ['oxides of silicon'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:00:44,919 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:44,919 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:44,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:44,920 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:44,920 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:45,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:45,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:45,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:45,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:45,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5275115966796875 s; generated tokens: 20 tokens; generate speed: 13.09319028639356 tokens/s +2024-07-30 14:00:46,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:46,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[629/2067], cost time 1.5671s, every example cost time is 1.5671, generate speed: 12.7623 tokens/s, avg speed: 10.4324 tokens/s, remaining time: 0:32:53 +pred is: + ['1'] + label is: + ['monatomic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:46,535 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:46,535 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:46,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:46,536 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:46,536 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:47,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:47,790 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.254213809967041 s; generated tokens: 11 tokens; generate speed: 8.77043444473719 tokens/s +2024-07-30 14:00:47,795 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:47,795 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[630/2067], cost time 1.2652s, every example cost time is 1.2652, generate speed: 8.6944 tokens/s, avg speed: 10.4299 tokens/s, remaining time: 0:32:51 +pred is: + ['Phlogiston'] + label is: + ['phlogiston'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.17771336146038, Em score: 51.74603174603175, current_count: 630 +2024-07-30 14:00:48,034 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:48,034 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:48,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:48,035 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:48,035 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:48,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,572 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372130870819092 s; generated tokens: 20 tokens; generate speed: 13.010557981890454 tokens/s +2024-07-30 14:00:49,577 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:49,577 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[631/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9169 tokens/s, avg speed: 10.4343 tokens/s, remaining time: 0:32:50 +pred is: + ['1'] + label is: + ['covalent double bond'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:49,689 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:49,689 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:49,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:49,690 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:49,690 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:50,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:50,945 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.254908561706543 s; generated tokens: 11 tokens; generate speed: 8.765578892091678 tokens/s +2024-07-30 14:00:50,950 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:50,950 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[632/2067], cost time 1.2665s, every example cost time is 1.2665, generate speed: 8.6853 tokens/s, avg speed: 10.4318 tokens/s, remaining time: 0:32:48 +pred is: + ['1773'] + label is: + ['1773'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:51,032 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:51,032 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:51,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:51,033 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:51,033 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:51,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,102 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0693151950836182 s; generated tokens: 5 tokens; generate speed: 4.675889787210038 tokens/s +2024-07-30 14:00:52,107 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:52,107 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[633/2067], cost time 1.0802s, every example cost time is 1.0802, generate speed: 4.6289 tokens/s, avg speed: 10.4246 tokens/s, remaining time: 0:32:46 +pred is: + ['Spin triplet state'] + label is: + ['spin triplet state'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:52,189 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:52,189 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:52,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:52,190 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:52,190 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:53,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:53,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:53,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:53,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:53,229 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0383760929107666 s; generated tokens: 4 tokens; generate speed: 3.8521688117714996 tokens/s +2024-07-30 14:00:53,233 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:53,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[634/2067], cost time 1.0491s, every example cost time is 1.0491, generate speed: 3.8128 tokens/s, avg speed: 10.4166 tokens/s, remaining time: 0:32:44 +pred is: + ['Nitrogen'] + label is: + ['air'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:53,316 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:53,316 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 308, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:53,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:53,317 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:53,317 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:54,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:54,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:54,297 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.980191707611084 s; generated tokens: 2 tokens; generate speed: 2.0404171800987636 tokens/s +2024-07-30 14:00:54,302 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:54,302 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[635/2067], cost time 0.9911s, every example cost time is 0.9911, generate speed: 2.0179 tokens/s, avg speed: 10.4070 tokens/s, remaining time: 0:32:42 +pred is: + ['ozone'] + label is: + ['ozone'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:54,384 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:54,385 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:54,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:54,385 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:54,386 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:55,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:55,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:55,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:55,395 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.009117841720581 s; generated tokens: 3 tokens; generate speed: 2.972893626461797 tokens/s +2024-07-30 14:00:55,400 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:55,400 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[636/2067], cost time 1.0201s, every example cost time is 1.0201, generate speed: 2.9410 tokens/s, avg speed: 10.3983 tokens/s, remaining time: 0:32:40 +pred is: + ['1'] + label is: + ['dioxygen'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:55,481 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:55,481 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:55,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:55,482 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:55,482 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:56,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0920486450195312 s; generated tokens: 5 tokens; generate speed: 4.57855061933672 tokens/s +2024-07-30 14:00:56,579 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:56,579 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[637/2067], cost time 1.1030s, every example cost time is 1.1030, generate speed: 4.5329 tokens/s, avg speed: 10.3909 tokens/s, remaining time: 0:32:38 +pred is: + ['James Dewar'] + label is: + ['James Dewar'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:56,661 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:56,662 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:56,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:56,662 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:56,663 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:57,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:57,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:57,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:57,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:57,703 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0402038097381592 s; generated tokens: 4 tokens; generate speed: 3.845400259596129 tokens/s +2024-07-30 14:00:57,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:57,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[638/2067], cost time 1.0511s, every example cost time is 1.0511, generate speed: 3.8055 tokens/s, avg speed: 10.3829 tokens/s, remaining time: 0:32:36 +pred is: + ['Oxygen'] + label is: + ['Oxygen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:00:57,790 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:57,790 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:57,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:57,791 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:57,791 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:00:58,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:58,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:59,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:59,320 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5292620658874512 s; generated tokens: 20 tokens; generate speed: 13.078203171405898 tokens/s +2024-07-30 14:00:59,325 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:00:59,325 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[639/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9853 tokens/s, avg speed: 10.3875 tokens/s, remaining time: 0:32:35 +pred is: + ['1'] + label is: + ['most abundant'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:00:59,407 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:00:59,408 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:00:59,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:00:59,408 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:00:59,408 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:00,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,666 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2569763660430908 s; generated tokens: 11 tokens; generate speed: 8.751158969382647 tokens/s +2024-07-30 14:01:00,670 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:00,671 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[640/2067], cost time 1.2680s, every example cost time is 1.2680, generate speed: 8.6752 tokens/s, avg speed: 10.3850 tokens/s, remaining time: 0:32:33 +pred is: + ['19th'] + label is: + ['late 19th'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 64.03431159018756, Em score: 51.71875, current_count: 640 +2024-07-30 14:01:00,923 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:00,923 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:00,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:00,924 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:00,924 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:01,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:01,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:01,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:01,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:01,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:02,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:02,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0994117259979248 s; generated tokens: 6 tokens; generate speed: 5.457464076575917 tokens/s +2024-07-30 14:01:02,028 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:02,028 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[641/2067], cost time 1.1108s, every example cost time is 1.1108, generate speed: 5.4014 tokens/s, avg speed: 10.3787 tokens/s, remaining time: 0:32:31 +pred is: + ['1'] + label is: + ['Sun'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:02,111 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:02,111 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:02,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:02,112 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:02,112 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:03,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:03,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:03,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:03,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:03,151 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0387816429138184 s; generated tokens: 4 tokens; generate speed: 3.850664889283047 tokens/s +2024-07-30 14:01:03,156 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:03,156 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[642/2067], cost time 1.0497s, every example cost time is 1.0497, generate speed: 3.8105 tokens/s, avg speed: 10.3709 tokens/s, remaining time: 0:32:29 +pred is: + ['Singlet oxygen'] + label is: + ['Singlet'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:01:03,239 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:03,239 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:03,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:03,240 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:03,240 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:04,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,770 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5295369625091553 s; generated tokens: 20 tokens; generate speed: 13.075852686286611 tokens/s +2024-07-30 14:01:04,774 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:04,775 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[643/2067], cost time 1.5406s, every example cost time is 1.5406, generate speed: 12.9817 tokens/s, avg speed: 10.3755 tokens/s, remaining time: 0:32:28 +pred is: + ['1'] + label is: + ['Paleoclimatologists'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:04,857 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:04,857 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:04,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:04,858 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:04,858 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:05,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:05,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:05,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:05,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:05,896 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0377624034881592 s; generated tokens: 4 tokens; generate speed: 3.854446823815428 tokens/s +2024-07-30 14:01:05,901 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:05,901 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[644/2067], cost time 1.0486s, every example cost time is 1.0486, generate speed: 3.8145 tokens/s, avg speed: 10.3676 tokens/s, remaining time: 0:32:26 +pred is: + ['687 nm'] + label is: + ['687 and 760 nm'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:01:05,983 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:05,983 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:05,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:05,984 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:05,984 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:06,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:06,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:06,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:06,992 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0081641674041748 s; generated tokens: 3 tokens; generate speed: 2.9757058393817073 tokens/s +2024-07-30 14:01:06,997 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:06,997 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[645/2067], cost time 1.0190s, every example cost time is 1.0190, generate speed: 2.9439 tokens/s, avg speed: 10.3591 tokens/s, remaining time: 0:32:24 +pred is: + ['1'] + label is: + ['paramagnetic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:07,085 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:07,085 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:07,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:07,086 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:07,086 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:08,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527050256729126 s; generated tokens: 20 tokens; generate speed: 13.097145894097235 tokens/s +2024-07-30 14:01:08,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:08,618 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[646/2067], cost time 1.5385s, every example cost time is 1.5385, generate speed: 13.0001 tokens/s, avg speed: 10.3637 tokens/s, remaining time: 0:32:23 +pred is: + ['1'] + label is: + ['dangerous by-products'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:08,700 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:08,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:08,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:08,701 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:08,701 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:09,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:09,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:10,235 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338108539581299 s; generated tokens: 20 tokens; generate speed: 13.039417440806533 tokens/s +2024-07-30 14:01:10,240 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:10,240 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[647/2067], cost time 1.5449s, every example cost time is 1.5449, generate speed: 12.9455 tokens/s, avg speed: 10.3682 tokens/s, remaining time: 0:32:22 +pred is: + ['90.20'] + label is: + ['90.20 K'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:01:10,322 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:10,322 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:10,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:10,323 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:10,323 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:11,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,855 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5314297676086426 s; generated tokens: 20 tokens; generate speed: 13.059691291772648 tokens/s +2024-07-30 14:01:11,860 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:11,860 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[648/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9658 tokens/s, avg speed: 10.3727 tokens/s, remaining time: 0:32:21 +pred is: + ['1'] + label is: + ['water'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:11,953 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:11,954 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:11,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:11,954 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:11,954 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:12,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:12,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:12,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:12,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,485 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5305259227752686 s; generated tokens: 20 tokens; generate speed: 13.067403630599372 tokens/s +2024-07-30 14:01:13,490 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:13,490 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[649/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9702 tokens/s, avg speed: 10.3772 tokens/s, remaining time: 0:32:20 +pred is: + ['3.5 billion years ago'] + label is: + ['3.5 billion years ago'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:13,572 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:13,572 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:13,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:13,573 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:13,573 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:14,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:14,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:15,106 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5322277545928955 s; generated tokens: 20 tokens; generate speed: 13.052889780941143 tokens/s +2024-07-30 14:01:15,110 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:15,111 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[650/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9593 tokens/s, avg speed: 10.3817 tokens/s, remaining time: 0:32:19 +pred is: + ['Photosynthesis'] + label is: + ['oxygen cycle'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.418399104184665, Em score: 51.07692307692308, current_count: 650 +2024-07-30 14:01:15,352 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:15,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:15,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:15,353 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:15,353 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:16,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,884 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307154655456543 s; generated tokens: 20 tokens; generate speed: 13.06578554288703 tokens/s +2024-07-30 14:01:16,889 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:16,889 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[651/2067], cost time 1.5418s, every example cost time is 1.5418, generate speed: 12.9715 tokens/s, avg speed: 10.3862 tokens/s, remaining time: 0:32:18 +pred is: + ['1'] + label is: + ['zeolite molecular sieves'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:16,971 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:16,972 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 260, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:16,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:16,972 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:16,973 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:17,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:17,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:17,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:18,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:18,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:18,044 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0711543560028076 s; generated tokens: 5 tokens; generate speed: 4.667861332943965 tokens/s +2024-07-30 14:01:18,049 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:18,049 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[652/2067], cost time 1.0822s, every example cost time is 1.0822, generate speed: 4.6204 tokens/s, avg speed: 10.3792 tokens/s, remaining time: 0:32:16 +pred is: + ['1'] + label is: + ['water'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:18,131 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:18,131 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:18,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:18,132 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:18,132 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:19,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,665 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5325431823730469 s; generated tokens: 20 tokens; generate speed: 13.050203237360826 tokens/s +2024-07-30 14:01:19,670 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:19,670 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[653/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9548 tokens/s, avg speed: 10.3836 tokens/s, remaining time: 0:32:15 +pred is: + ['1'] + label is: + ['recreational'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:19,752 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:19,752 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:19,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:19,753 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:19,753 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:20,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:20,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:20,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:20,762 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.008685827255249 s; generated tokens: 3 tokens; generate speed: 2.974166900077646 tokens/s +2024-07-30 14:01:20,767 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:20,767 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[654/2067], cost time 1.0197s, every example cost time is 1.0197, generate speed: 2.9420 tokens/s, avg speed: 10.3751 tokens/s, remaining time: 0:32:13 +pred is: + ['oxygen chamber'] + label is: + ['Hyperbaric (high-pressure) medicine'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:01:20,848 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:20,849 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:20,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:20,849 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:20,850 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:21,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:21,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:21,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:21,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:21,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:21,920 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0698230266571045 s; generated tokens: 5 tokens; generate speed: 4.673670200971081 tokens/s +2024-07-30 14:01:21,924 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:21,925 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[655/2067], cost time 1.0808s, every example cost time is 1.0808, generate speed: 4.6261 tokens/s, avg speed: 10.3682 tokens/s, remaining time: 0:32:11 +pred is: + ['Oxygen therapy'] + label is: + ['Oxygen therapy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:22,007 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:22,007 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:22,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:22,008 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:22,008 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:22,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:22,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5262031555175781 s; generated tokens: 20 tokens; generate speed: 13.104415311746253 tokens/s +2024-07-30 14:01:23,539 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:23,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[656/2067], cost time 1.5374s, every example cost time is 1.5374, generate speed: 13.0094 tokens/s, avg speed: 10.3727 tokens/s, remaining time: 0:32:10 +pred is: + ['1'] + label is: + ['electronegativity'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:23,621 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:23,621 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:23,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:23,622 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:23,622 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:24,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:24,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:25,151 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5285577774047852 s; generated tokens: 20 tokens; generate speed: 13.084229000461066 tokens/s +2024-07-30 14:01:25,164 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:25,164 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[657/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9220 tokens/s, avg speed: 10.3771 tokens/s, remaining time: 0:32:09 +pred is: + ['Cabin depressurization'] + label is: + ['cabin depressurization'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:25,246 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:25,246 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:25,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:25,247 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:25,247 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:26,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,776 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5283360481262207 s; generated tokens: 20 tokens; generate speed: 13.086127245719627 tokens/s +2024-07-30 14:01:26,781 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:26,781 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[658/2067], cost time 1.5397s, every example cost time is 1.5397, generate speed: 12.9898 tokens/s, avg speed: 10.3816 tokens/s, remaining time: 0:32:08 +pred is: + ['1'] + label is: + ['storage'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:26,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:26,863 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 300, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:26,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:26,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:26,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:27,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:27,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:27,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:27,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:27,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:27,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0726845264434814 s; generated tokens: 5 tokens; generate speed: 4.661202689832447 tokens/s +2024-07-30 14:01:27,941 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:27,942 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[659/2067], cost time 1.0837s, every example cost time is 1.0837, generate speed: 4.6139 tokens/s, avg speed: 10.3747 tokens/s, remaining time: 0:32:06 +pred is: + ['Alcohols'] + label is: + ['organic solvents'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:28,024 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:28,024 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:28,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:28,025 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:28,025 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:28,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:28,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:29,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:29,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:29,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:29,094 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0689785480499268 s; generated tokens: 5 tokens; generate speed: 4.677362337271593 tokens/s +2024-07-30 14:01:29,098 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:29,099 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[660/2067], cost time 1.0799s, every example cost time is 1.0799, generate speed: 4.6300 tokens/s, avg speed: 10.3678 tokens/s, remaining time: 0:32:04 +pred is: + ['Carbohydrates'] + label is: + ['biomolecules'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.790847602606114, Em score: 50.60606060606061, current_count: 660 +2024-07-30 14:01:29,342 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:29,342 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:29,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:29,342 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:29,343 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:30,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,871 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5282111167907715 s; generated tokens: 20 tokens; generate speed: 13.087197037278335 tokens/s +2024-07-30 14:01:30,876 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:30,876 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[661/2067], cost time 1.5394s, every example cost time is 1.5394, generate speed: 12.9925 tokens/s, avg speed: 10.3722 tokens/s, remaining time: 0:32:03 +pred is: + ['1'] + label is: + ['Oxygen toxicity'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:30,958 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:30,958 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:30,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:30,959 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:30,959 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:31,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:31,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:31,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:31,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,490 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310330390930176 s; generated tokens: 20 tokens; generate speed: 13.06307538069066 tokens/s +2024-07-30 14:01:32,495 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:32,495 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[662/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9698 tokens/s, avg speed: 10.3767 tokens/s, remaining time: 0:32:02 +pred is: + ['1'] + label is: + ['low total pressures'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:32,577 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:32,577 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:32,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:32,578 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:32,578 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:33,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:33,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:34,106 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528188705444336 s; generated tokens: 20 tokens; generate speed: 13.0873889649543 tokens/s +2024-07-30 14:01:34,111 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:34,111 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[663/2067], cost time 1.5392s, every example cost time is 1.5392, generate speed: 12.9939 tokens/s, avg speed: 10.3811 tokens/s, remaining time: 0:32:01 +pred is: + ['50% oxygen composition at standard pressure'] + label is: + ['at elevated partial pressures'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 14:01:34,193 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:34,194 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:34,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:34,194 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:34,195 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:35,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,539 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3444693088531494 s; generated tokens: 14 tokens; generate speed: 10.413030559947991 tokens/s +2024-07-30 14:01:35,544 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:35,544 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[664/2067], cost time 1.3554s, every example cost time is 1.3554, generate speed: 10.3288 tokens/s, avg speed: 10.3810 tokens/s, remaining time: 0:32:00 +pred is: + ['October 1973'] + label is: + ['October 1973'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:35,626 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:35,626 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:35,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:35,627 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:35,627 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:36,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:36,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:37,155 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5277040004730225 s; generated tokens: 20 tokens; generate speed: 13.091541289286019 tokens/s +2024-07-30 14:01:37,160 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:37,160 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[665/2067], cost time 1.5387s, every example cost time is 1.5387, generate speed: 12.9976 tokens/s, avg speed: 10.3855 tokens/s, remaining time: 0:31:59 +pred is: + ['1'] + label is: + ['to avoid being targeted by the boycott'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:37,243 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:37,243 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:37,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:37,244 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:37,244 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:38,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5288195610046387 s; generated tokens: 20 tokens; generate speed: 13.081988555181312 tokens/s +2024-07-30 14:01:38,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:38,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[666/2067], cost time 1.5399s, every example cost time is 1.5399, generate speed: 12.9883 tokens/s, avg speed: 10.3898 tokens/s, remaining time: 0:31:58 +pred is: + ['August 15, 1971'] + label is: + ['On August 15, 1971'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:01:38,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:38,860 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:38,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:38,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:38,861 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:39,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:39,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:40,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:40,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1633949279785156 s; generated tokens: 8 tokens; generate speed: 6.876426746935015 tokens/s +2024-07-30 14:01:40,029 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:40,029 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[667/2067], cost time 1.1744s, every example cost time is 1.1744, generate speed: 6.8119 tokens/s, avg speed: 10.3852 tokens/s, remaining time: 0:31:56 +pred is: + ['less than two percent per year'] + label is: + ['risen by less than two percent per year'] +The F1/Em of this example is: {'F1': 84.6153846153846, 'Em': 0.0} +2024-07-30 14:01:40,112 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:40,112 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:40,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:40,113 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:40,113 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:41,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,644 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311145782470703 s; generated tokens: 20 tokens; generate speed: 13.062379709621363 tokens/s +2024-07-30 14:01:41,649 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:41,649 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[668/2067], cost time 1.5423s, every example cost time is 1.5423, generate speed: 12.9675 tokens/s, avg speed: 10.3896 tokens/s, remaining time: 0:31:55 +pred is: + ['October 6, 1973'] + label is: + ['On October 6, 1973'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:01:41,732 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:41,732 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:41,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:41,733 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:41,733 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:42,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:42,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:43,262 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5284454822540283 s; generated tokens: 20 tokens; generate speed: 13.085190301001518 tokens/s +2024-07-30 14:01:43,266 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:43,267 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[669/2067], cost time 1.5396s, every example cost time is 1.5396, generate speed: 12.9904 tokens/s, avg speed: 10.3940 tokens/s, remaining time: 0:31:54 +pred is: + ['1'] + label is: + ['In response to American aid to Israel'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:43,361 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:43,362 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:43,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:43,362 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:43,362 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:44,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,432 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.069162130355835 s; generated tokens: 5 tokens; generate speed: 4.676559202799221 tokens/s +2024-07-30 14:01:44,436 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:44,437 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[670/2067], cost time 1.0807s, every example cost time is 1.0807, generate speed: 4.6266 tokens/s, avg speed: 10.3872 tokens/s, remaining time: 0:31:52 +pred is: + ['100 billion dollars'] + label is: + ['over 100 billion dollars'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +F1 score: 62.542625267641114, Em score: 50.0, current_count: 670 +2024-07-30 14:01:44,684 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:44,685 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:44,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:44,685 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:44,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:45,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:45,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:46,211 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5251061916351318 s; generated tokens: 20 tokens; generate speed: 13.11384093100897 tokens/s +2024-07-30 14:01:46,215 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:46,216 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[671/2067], cost time 1.5363s, every example cost time is 1.5363, generate speed: 13.0181 tokens/s, avg speed: 10.3916 tokens/s, remaining time: 0:31:51 +pred is: + ['The possibility that the Middle East could become another superpower confrontation with the USSR was of more concern'] + label is: + ['distribution and price disruptions'] +The F1/Em of this example is: {'F1': 4.761904761904761, 'Em': 0.0} +2024-07-30 14:01:46,299 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:46,299 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:46,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:46,300 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:46,300 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:47,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,825 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5252282619476318 s; generated tokens: 20 tokens; generate speed: 13.112791376197757 tokens/s +2024-07-30 14:01:47,830 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:47,830 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[672/2067], cost time 1.5363s, every example cost time is 1.5363, generate speed: 13.0185 tokens/s, avg speed: 10.3960 tokens/s, remaining time: 0:31:50 +pred is: + ['1'] + label is: + ['The embargo'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:47,913 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:47,913 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:47,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:47,914 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:47,914 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:48,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:48,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:48,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:48,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:48,954 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0397963523864746 s; generated tokens: 4 tokens; generate speed: 3.8469071283232084 tokens/s +2024-07-30 14:01:48,959 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:48,959 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[673/2067], cost time 1.0509s, every example cost time is 1.0509, generate speed: 3.8062 tokens/s, avg speed: 10.3884 tokens/s, remaining time: 0:31:48 +pred is: + ['Netherlands'] + label is: + ['Netherlands'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:49,041 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:49,041 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:49,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:49,042 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:49,042 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:49,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:50,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:50,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:50,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:50,082 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0390918254852295 s; generated tokens: 4 tokens; generate speed: 3.8495154151868163 tokens/s +2024-07-30 14:01:50,086 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:50,087 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[674/2067], cost time 1.0501s, every example cost time is 1.0501, generate speed: 3.8090 tokens/s, avg speed: 10.3810 tokens/s, remaining time: 0:31:46 +pred is: + ['Norway'] + label is: + ['UK'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:50,171 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:50,172 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:50,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:50,173 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:50,173 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:51,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,704 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310516357421875 s; generated tokens: 20 tokens; generate speed: 13.06291671234515 tokens/s +2024-07-30 14:01:51,709 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:51,709 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[675/2067], cost time 1.5432s, every example cost time is 1.5432, generate speed: 12.9599 tokens/s, avg speed: 10.3853 tokens/s, remaining time: 0:31:45 +pred is: + ['1'] + label is: + ['Price controls'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:51,791 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:51,791 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:51,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:51,791 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:51,792 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:52,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:52,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:53,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:53,319 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.527285099029541 s; generated tokens: 20 tokens; generate speed: 13.095132017400214 tokens/s +2024-07-30 14:01:53,324 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:53,324 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[676/2067], cost time 1.5384s, every example cost time is 1.5384, generate speed: 13.0003 tokens/s, avg speed: 10.3896 tokens/s, remaining time: 0:31:44 +pred is: + ['1'] + label is: + ['William E. Simon'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:53,406 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:53,406 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:53,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:53,407 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:53,407 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:54,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:54,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:54,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:54,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:54,449 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0418970584869385 s; generated tokens: 4 tokens; generate speed: 3.8391508714007423 tokens/s +2024-07-30 14:01:54,454 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:54,454 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[677/2067], cost time 1.0529s, every example cost time is 1.0529, generate speed: 3.7990 tokens/s, avg speed: 10.3821 tokens/s, remaining time: 0:31:42 +pred is: + ['55 mph'] + label is: + ['55 mph'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:01:54,535 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:54,536 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:54,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:54,536 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:54,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:55,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:55,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:56,068 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311625003814697 s; generated tokens: 20 tokens; generate speed: 13.061970884878159 tokens/s +2024-07-30 14:01:56,073 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:56,073 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[678/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9681 tokens/s, avg speed: 10.3864 tokens/s, remaining time: 0:31:41 +pred is: + ['The energy crisis'] + label is: + ['energy crisis'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:01:56,155 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:56,155 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 305, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:56,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:56,156 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:56,156 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:57,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,692 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353758335113525 s; generated tokens: 20 tokens; generate speed: 13.026126609183809 tokens/s +2024-07-30 14:01:57,697 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:57,697 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[679/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9329 tokens/s, avg speed: 10.3907 tokens/s, remaining time: 0:31:40 +pred is: + ['United States'] + label is: + ['U.S'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:01:57,779 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:57,779 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:57,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:57,780 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:57,780 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:01:58,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:58,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:59,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:59,312 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5322487354278564 s; generated tokens: 20 tokens; generate speed: 13.052711049825284 tokens/s +2024-07-30 14:01:59,317 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:01:59,317 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[680/2067], cost time 1.5434s, every example cost time is 1.5434, generate speed: 12.9581 tokens/s, avg speed: 10.3949 tokens/s, remaining time: 0:31:39 +pred is: + ['Japan'] + label is: + ['Japan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.181354167766834, Em score: 49.705882352941174, current_count: 680 +2024-07-30 14:01:59,568 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:01:59,568 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 386, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:01:59,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:01:59,569 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:01:59,569 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:00,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:00,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:01,108 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390243530273438 s; generated tokens: 20 tokens; generate speed: 12.995245956088299 tokens/s +2024-07-30 14:02:01,113 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:01,113 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[681/2067], cost time 1.5506s, every example cost time is 1.5506, generate speed: 12.8982 tokens/s, avg speed: 10.3991 tokens/s, remaining time: 0:31:38 +pred is: + ['Iran'] + label is: + ["USSR's invasion"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:01,196 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:01,196 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:01,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:01,197 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:01,197 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:02,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,725 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5285184383392334 s; generated tokens: 20 tokens; generate speed: 13.084565745723296 tokens/s +2024-07-30 14:02:02,730 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:02,730 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[682/2067], cost time 1.5396s, every example cost time is 1.5396, generate speed: 12.9901 tokens/s, avg speed: 10.4033 tokens/s, remaining time: 0:31:37 +pred is: + ['Small cars'] + label is: + ['large cars'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:02:02,813 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:02,813 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:02,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:02,813 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:02,814 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:03,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:03,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:04,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:04,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:04,349 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354321002960205 s; generated tokens: 20 tokens; generate speed: 13.025649259347997 tokens/s +2024-07-30 14:02:04,354 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:04,354 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[683/2067], cost time 1.5465s, every example cost time is 1.5465, generate speed: 12.9323 tokens/s, avg speed: 10.4075 tokens/s, remaining time: 0:31:36 +pred is: + ['1981'] + label is: + ['A decade after the 1973'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:04,437 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:04,437 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:04,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:04,438 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:04,438 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:05,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:05,966 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5275657176971436 s; generated tokens: 20 tokens; generate speed: 13.092726400112376 tokens/s +2024-07-30 14:02:05,970 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:05,971 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[684/2067], cost time 1.5386s, every example cost time is 1.5386, generate speed: 12.9985 tokens/s, avg speed: 10.4118 tokens/s, remaining time: 0:31:35 +pred is: + ['Hilux'] + label is: + ['Toyota Hilux'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:02:06,054 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:06,054 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 302, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:06,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:06,055 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:06,055 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:07,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,406 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.35105562210083 s; generated tokens: 14 tokens; generate speed: 10.362267674983386 tokens/s +2024-07-30 14:02:07,411 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:07,412 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[685/2067], cost time 1.3628s, every example cost time is 1.3628, generate speed: 10.2729 tokens/s, avg speed: 10.4116 tokens/s, remaining time: 0:31:33 +pred is: + ['1'] + label is: + ['An increase in imported cars'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:07,494 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:07,494 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:07,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:07,495 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:07,495 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:08,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,752 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2569608688354492 s; generated tokens: 11 tokens; generate speed: 8.75126686337602 tokens/s +2024-07-30 14:02:08,757 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:08,757 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[686/2067], cost time 1.2682s, every example cost time is 1.2682, generate speed: 8.6735 tokens/s, avg speed: 10.4092 tokens/s, remaining time: 0:31:32 +pred is: + ['1979'] + label is: + ['1979'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:08,839 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:08,839 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:08,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:08,840 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:08,840 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:09,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:09,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:10,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:10,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:10,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:10,381 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402858257293701 s; generated tokens: 20 tokens; generate speed: 12.98460303010931 tokens/s +2024-07-30 14:02:10,385 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:10,386 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[687/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8917 tokens/s, avg speed: 10.4133 tokens/s, remaining time: 0:31:31 +pred is: + ['1981'] + label is: + ['1981'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:10,469 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:10,469 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:10,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:10,470 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:10,470 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:11,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:11,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:12,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.55934476852417 s; generated tokens: 20 tokens; generate speed: 12.825899957280678 tokens/s +2024-07-30 14:02:12,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:12,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[688/2067], cost time 1.5705s, every example cost time is 1.5705, generate speed: 12.7344 tokens/s, avg speed: 10.4172 tokens/s, remaining time: 0:31:30 +pred is: + ['Project Mercury'] + label is: + ['Project Mercury'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:12,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:12,116 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:12,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:12,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:12,117 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:13,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,250 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1329681873321533 s; generated tokens: 7 tokens; generate speed: 6.178461212122105 tokens/s +2024-07-30 14:02:13,255 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:13,255 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[689/2067], cost time 1.1439s, every example cost time is 1.1439, generate speed: 6.1193 tokens/s, avg speed: 10.4120 tokens/s, remaining time: 0:31:28 +pred is: + ['1961-1972'] + label is: + ['1961 to 1972'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:13,337 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:13,337 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:13,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:13,338 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:13,338 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:14,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:14,868 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529672384262085 s; generated tokens: 20 tokens; generate speed: 13.074695082272806 tokens/s +2024-07-30 14:02:14,873 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:14,873 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[690/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9815 tokens/s, avg speed: 10.4162 tokens/s, remaining time: 0:31:27 +pred is: + ['1967'] + label is: + ['1967'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.02896739238857, Em score: 49.56521739130435, current_count: 690 +2024-07-30 14:02:15,126 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:15,127 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:15,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:15,127 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:15,127 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:16,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,659 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530963659286499 s; generated tokens: 20 tokens; generate speed: 13.06366736968854 tokens/s +2024-07-30 14:02:16,663 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:16,664 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[691/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9695 tokens/s, avg speed: 10.4203 tokens/s, remaining time: 0:31:26 +pred is: + ['Apollo 8'] + label is: + ['Apollo 8'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:16,770 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:16,770 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:16,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:16,771 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:16,771 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:17,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:17,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:17,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:17,780 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0087614059448242 s; generated tokens: 3 tokens; generate speed: 2.9739440687564227 tokens/s +2024-07-30 14:02:17,785 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:17,785 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[692/2067], cost time 1.0202s, every example cost time is 1.0202, generate speed: 2.9407 tokens/s, avg speed: 10.4123 tokens/s, remaining time: 0:31:24 +pred is: + ['1'] + label is: + ['one'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:17,868 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:17,868 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:17,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:17,869 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:17,869 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:18,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:18,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:19,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:19,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:19,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:19,401 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5320658683776855 s; generated tokens: 20 tokens; generate speed: 13.054269018588691 tokens/s +2024-07-30 14:02:19,406 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:19,406 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[693/2067], cost time 1.5432s, every example cost time is 1.5432, generate speed: 12.9601 tokens/s, avg speed: 10.4164 tokens/s, remaining time: 0:31:23 +pred is: + ['1960'] + label is: + ['1960'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:19,489 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:19,489 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 256, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:19,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:19,489 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:19,490 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:20,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:20,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:21,045 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5551207065582275 s; generated tokens: 20 tokens; generate speed: 12.860738022236058 tokens/s +2024-07-30 14:02:21,050 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:21,050 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[694/2067], cost time 1.5663s, every example cost time is 1.5663, generate speed: 12.7690 tokens/s, avg speed: 10.4203 tokens/s, remaining time: 0:31:22 +pred is: + ['John F. Kennedy'] + label is: + ['John F. Kennedy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:21,132 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:21,132 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:21,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:21,133 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:21,133 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:22,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1313166618347168 s; generated tokens: 7 tokens; generate speed: 6.187480690550182 tokens/s +2024-07-30 14:02:22,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:22,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[695/2067], cost time 1.1423s, every example cost time is 1.1423, generate speed: 6.1280 tokens/s, avg speed: 10.4151 tokens/s, remaining time: 0:31:20 +pred is: + ['Yuri Gagarin'] + label is: + ['Yuri Gagarin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:22,351 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:22,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:22,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:22,352 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:22,352 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:23,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,884 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311617851257324 s; generated tokens: 20 tokens; generate speed: 13.061976986551873 tokens/s +2024-07-30 14:02:23,889 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:23,889 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[696/2067], cost time 1.5423s, every example cost time is 1.5423, generate speed: 12.9680 tokens/s, avg speed: 10.4193 tokens/s, remaining time: 0:31:19 +pred is: + ['April 20'] + label is: + ['April 20'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:23,970 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:23,971 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:23,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:23,971 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:23,972 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:24,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:24,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:24,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,508 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536423683166504 s; generated tokens: 20 tokens; generate speed: 13.017242717048497 tokens/s +2024-07-30 14:02:25,513 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:25,513 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[697/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9228 tokens/s, avg speed: 10.4233 tokens/s, remaining time: 0:31:18 +pred is: + ['Robert R. Gilruth'] + label is: + ['Robert R. Gilruth'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:25,596 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:25,596 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:25,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:25,597 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:25,597 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:26,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:26,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:27,157 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5596985816955566 s; generated tokens: 20 tokens; generate speed: 12.822990438484526 tokens/s +2024-07-30 14:02:27,162 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:27,162 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[698/2067], cost time 1.5710s, every example cost time is 1.5710, generate speed: 12.7311 tokens/s, avg speed: 10.4271 tokens/s, remaining time: 0:31:17 +pred is: + ['Immediately north of Canaveral at Merritt Island'] + label is: + ['Merritt Island'] +The F1/Em of this example is: {'F1': 37.5, 'Em': 0.0} +2024-07-30 14:02:27,245 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:27,245 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:27,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:27,246 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:27,246 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:28,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,442 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1960577964782715 s; generated tokens: 8 tokens; generate speed: 6.688639983415161 tokens/s +2024-07-30 14:02:28,447 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:28,447 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[699/2067], cost time 1.2075s, every example cost time is 1.2075, generate speed: 6.6255 tokens/s, avg speed: 10.4223 tokens/s, remaining time: 0:31:15 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:28,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:28,529 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:28,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:28,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:28,530 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:29,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:29,947 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4175422191619873 s; generated tokens: 16 tokens; generate speed: 11.287141775190843 tokens/s +2024-07-30 14:02:29,952 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:29,952 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[700/2067], cost time 1.4287s, every example cost time is 1.4287, generate speed: 11.1990 tokens/s, avg speed: 10.4235 tokens/s, remaining time: 0:31:14 +pred is: + ['Dr. George E. Mueller'] + label is: + ['Dr. George E. Mueller'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.19641071535445, Em score: 49.857142857142854, current_count: 700 +2024-07-30 14:02:30,206 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:30,206 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:30,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:30,207 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:30,207 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:31,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5351815223693848 s; generated tokens: 20 tokens; generate speed: 13.02777535332251 tokens/s +2024-07-30 14:02:31,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:31,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[701/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9316 tokens/s, avg speed: 10.4275 tokens/s, remaining time: 0:31:13 +pred is: + ['1'] + label is: + ['Air Force missile projects'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:31,830 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:31,830 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:31,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:31,831 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:31,831 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:32,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:32,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:33,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:33,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:33,363 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5320923328399658 s; generated tokens: 20 tokens; generate speed: 13.054043526819928 tokens/s +2024-07-30 14:02:33,368 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:33,368 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[702/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9596 tokens/s, avg speed: 10.4316 tokens/s, remaining time: 0:31:12 +pred is: + ['A rendezvous'] + label is: + ['a rendezvous —let alone a docking'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:02:33,451 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:33,452 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:33,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:33,452 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:33,453 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:34,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:34,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:35,010 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.556816577911377 s; generated tokens: 20 tokens; generate speed: 12.846728563766948 tokens/s +2024-07-30 14:02:35,014 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:35,015 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[703/2067], cost time 1.5681s, every example cost time is 1.5681, generate speed: 12.7539 tokens/s, avg speed: 10.4353 tokens/s, remaining time: 0:31:11 +pred is: + ['Nicholas E. Golovin'] + label is: + ['Nicholas E. Golovin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:35,096 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:35,097 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:35,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:35,097 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:35,098 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:36,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,650 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5526630878448486 s; generated tokens: 20 tokens; generate speed: 12.881094524994928 tokens/s +2024-07-30 14:02:36,655 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:36,655 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[704/2067], cost time 1.5638s, every example cost time is 1.5638, generate speed: 12.7894 tokens/s, avg speed: 10.4392 tokens/s, remaining time: 0:31:10 +pred is: + ['Jerome Wiesner'] + label is: + ['Jerome Wiesner'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:36,738 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:36,738 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:36,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:36,739 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:36,739 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:37,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:37,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:38,271 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5320756435394287 s; generated tokens: 20 tokens; generate speed: 13.054185727928969 tokens/s +2024-07-30 14:02:38,276 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:38,276 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[705/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9594 tokens/s, avg speed: 10.4432 tokens/s, remaining time: 0:31:09 +pred is: + ['Wiesner'] + label is: + ['Wiesner'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:38,359 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:38,359 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:38,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:38,360 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:38,360 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:39,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,910 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5497910976409912 s; generated tokens: 20 tokens; generate speed: 12.904965082353955 tokens/s +2024-07-30 14:02:39,915 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:39,915 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[706/2067], cost time 1.5610s, every example cost time is 1.5610, generate speed: 12.8120 tokens/s, avg speed: 10.4470 tokens/s, remaining time: 0:31:08 +pred is: + ['The LOR method had the advantage of allowing the lander spacecraft to be used as a "'] + label is: + ['spacecraft to be used as a "lifeboat"'] +The F1/Em of this example is: {'F1': 54.166666666666664, 'Em': 0.0} +2024-07-30 14:02:39,998 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:39,998 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:39,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:39,999 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:39,999 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:40,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:40,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:41,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:41,010 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0109148025512695 s; generated tokens: 3 tokens; generate speed: 2.967609132271908 tokens/s +2024-07-30 14:02:41,015 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:41,015 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[707/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9354 tokens/s, avg speed: 10.4391 tokens/s, remaining time: 0:31:06 +pred is: + ['cone'] + label is: + ['cone-shaped'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:41,097 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:41,097 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:41,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:41,098 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:41,098 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:42,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,288 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1899151802062988 s; generated tokens: 8 tokens; generate speed: 6.723168283820884 tokens/s +2024-07-30 14:02:42,293 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:42,293 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[708/2067], cost time 1.2010s, every example cost time is 1.2010, generate speed: 6.6610 tokens/s, avg speed: 10.4344 tokens/s, remaining time: 0:31:04 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:42,375 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:42,376 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:42,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:42,376 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:42,376 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:43,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,573 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1963584423065186 s; generated tokens: 9 tokens; generate speed: 7.522829013224879 tokens/s +2024-07-30 14:02:43,578 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:43,578 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[709/2067], cost time 1.2076s, every example cost time is 1.2076, generate speed: 7.4529 tokens/s, avg speed: 10.4307 tokens/s, remaining time: 0:31:02 +pred is: + ['A cylindrical Service Module (SM)'] + label is: + ['Service Module (SM)'] +The F1/Em of this example is: {'F1': 77.77777777777779, 'Em': 0.0} +2024-07-30 14:02:43,660 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:43,661 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:43,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:43,661 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:43,662 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:44,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:44,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:45,194 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532362699508667 s; generated tokens: 20 tokens; generate speed: 13.05174030039543 tokens/s +2024-07-30 14:02:45,199 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:45,199 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[710/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9571 tokens/s, avg speed: 10.4347 tokens/s, remaining time: 0:31:01 +pred is: + ['1'] + label is: + ['North American Aviation'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 61.98511541576416, Em score: 49.57746478873239, current_count: 710 +2024-07-30 14:02:45,470 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:45,471 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:45,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:45,471 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:45,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:46,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,703 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2313954830169678 s; generated tokens: 10 tokens; generate speed: 8.1208678592028 tokens/s +2024-07-30 14:02:46,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:46,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[711/2067], cost time 1.2431s, every example cost time is 1.2431, generate speed: 8.0444 tokens/s, avg speed: 10.4317 tokens/s, remaining time: 0:31:00 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:46,790 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:46,791 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:46,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:46,791 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:46,792 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:47,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:47,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:48,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:48,326 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5340673923492432 s; generated tokens: 20 tokens; generate speed: 13.037236890468261 tokens/s +2024-07-30 14:02:48,331 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:48,331 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[712/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9418 tokens/s, avg speed: 10.4356 tokens/s, remaining time: 0:30:59 +pred is: + ['Wernher von Braun'] + label is: + ['Wernher von Braun'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:48,415 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:48,415 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:48,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:48,416 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:48,416 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:49,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,598 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1822307109832764 s; generated tokens: 8 tokens; generate speed: 6.766868704794767 tokens/s +2024-07-30 14:02:49,603 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:49,603 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[713/2067], cost time 1.1938s, every example cost time is 1.1938, generate speed: 6.7015 tokens/s, avg speed: 10.4311 tokens/s, remaining time: 0:30:57 +pred is: + ['Dummy upper stages filled with water'] + label is: + ['dummy upper stages filled with water'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:49,686 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:49,686 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:49,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:49,687 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:49,687 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:50,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:50,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:51,220 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5331485271453857 s; generated tokens: 20 tokens; generate speed: 13.045050525690806 tokens/s +2024-07-30 14:02:51,225 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:51,225 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[714/2067], cost time 1.5446s, every example cost time is 1.5446, generate speed: 12.9486 tokens/s, avg speed: 10.4350 tokens/s, remaining time: 0:30:56 +pred is: + ['Saturn IB'] + label is: + ['Saturn IB'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:51,307 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:51,307 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:51,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:51,308 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:51,308 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:52,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,567 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.259035587310791 s; generated tokens: 11 tokens; generate speed: 8.736845972316958 tokens/s +2024-07-30 14:02:52,572 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:52,572 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[715/2067], cost time 1.2703s, every example cost time is 1.2703, generate speed: 8.6594 tokens/s, avg speed: 10.4327 tokens/s, remaining time: 0:30:54 +pred is: + ['Saturn V'] + label is: + ['three-stage Saturn V'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:02:52,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:52,655 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:52,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:52,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:52,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:53,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,791 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.134916067123413 s; generated tokens: 7 tokens; generate speed: 6.1678569920526165 tokens/s +2024-07-30 14:02:53,795 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:53,796 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[716/2067], cost time 1.1460s, every example cost time is 1.1460, generate speed: 6.1082 tokens/s, avg speed: 10.4277 tokens/s, remaining time: 0:30:53 +pred is: + ['Project Mercury and Gemini veterans'] + label is: + ['Mercury and Gemini'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 14:02:53,878 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:53,878 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:53,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:53,879 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:53,879 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:54,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:54,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:54,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:54,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:54,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:54,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:55,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:55,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:55,044 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1645777225494385 s; generated tokens: 8 tokens; generate speed: 6.869442756029008 tokens/s +2024-07-30 14:02:55,049 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:55,049 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[717/2067], cost time 1.1758s, every example cost time is 1.1758, generate speed: 6.8037 tokens/s, avg speed: 10.4234 tokens/s, remaining time: 0:30:51 +pred is: + ['32'] + label is: + ['32'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:55,131 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:55,131 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:55,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:55,132 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:55,132 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:56,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,545 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4127893447875977 s; generated tokens: 16 tokens; generate speed: 11.325113725574905 tokens/s +2024-07-30 14:02:56,550 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:56,550 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[718/2067], cost time 1.4240s, every example cost time is 1.4240, generate speed: 11.2358 tokens/s, avg speed: 10.4245 tokens/s, remaining time: 0:30:50 +pred is: + ['1966'] + label is: + ['1966'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:02:56,632 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:56,632 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:56,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:56,633 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:56,633 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:57,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:57,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:57,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:57,644 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0107312202453613 s; generated tokens: 3 tokens; generate speed: 2.968148148497611 tokens/s +2024-07-30 14:02:57,648 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:57,649 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[719/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9355 tokens/s, avg speed: 10.4168 tokens/s, remaining time: 0:30:48 +pred is: + ['1'] + label is: + ['unmanned'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:02:57,731 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:57,731 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:57,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:57,732 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:57,732 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:02:58,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:58,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:59,278 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5461091995239258 s; generated tokens: 20 tokens; generate speed: 12.935696913360552 tokens/s +2024-07-30 14:02:59,283 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:02:59,283 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[720/2067], cost time 1.5574s, every example cost time is 1.5574, generate speed: 12.8415 tokens/s, avg speed: 10.4206 tokens/s, remaining time: 0:30:47 +pred is: + ['Deke Slayton'] + label is: + ['Deke Slayton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.16091738419601, Em score: 49.72222222222222, current_count: 720 +2024-07-30 14:02:59,544 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:02:59,545 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:02:59,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:02:59,545 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:02:59,545 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:00,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,649 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.103370189666748 s; generated tokens: 6 tokens; generate speed: 5.437884815260584 tokens/s +2024-07-30 14:03:00,654 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:00,654 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[721/2067], cost time 1.1149s, every example cost time is 1.1149, generate speed: 5.3814 tokens/s, avg speed: 10.4149 tokens/s, remaining time: 0:30:45 +pred is: + ['It was canceled.'] + label is: + ['canceled'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:03:00,736 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:00,736 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:00,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:00,737 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:00,737 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:01,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:01,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:02,061 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.323502779006958 s; generated tokens: 13 tokens; generate speed: 9.822419874141916 tokens/s +2024-07-30 14:03:02,066 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:02,066 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[722/2067], cost time 1.3348s, every example cost time is 1.3348, generate speed: 9.7396 tokens/s, avg speed: 10.4140 tokens/s, remaining time: 0:30:43 +pred is: + ['Samuel Phillips'] + label is: + ['Samuel Phillips'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:02,148 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:02,148 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:02,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:02,149 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:02,149 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:03,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,685 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354974269866943 s; generated tokens: 20 tokens; generate speed: 13.025095091985008 tokens/s +2024-07-30 14:03:03,690 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:03,690 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[723/2067], cost time 1.5469s, every example cost time is 1.5469, generate speed: 12.9295 tokens/s, avg speed: 10.4179 tokens/s, remaining time: 0:30:42 +pred is: + ['Altitude Chamber'] + label is: + ['altitude chamber'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:03,773 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:03,773 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:03,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:03,774 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:03,774 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:04,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:04,968 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.194568157196045 s; generated tokens: 9 tokens; generate speed: 7.534103387725726 tokens/s +2024-07-30 14:03:04,973 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:04,973 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[724/2067], cost time 1.2056s, every example cost time is 1.2056, generate speed: 7.4649 tokens/s, avg speed: 10.4143 tokens/s, remaining time: 0:30:41 +pred is: + ['A strange odor in their spacesuits'] + label is: + ['strange odor in their spacesuits'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +2024-07-30 14:03:05,055 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:05,056 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:05,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:05,056 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:05,057 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:05,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,592 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353384017944336 s; generated tokens: 20 tokens; generate speed: 13.026444187564715 tokens/s +2024-07-30 14:03:06,597 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:06,597 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[725/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9318 tokens/s, avg speed: 10.4183 tokens/s, remaining time: 0:30:39 +pred is: + ['Congress'] + label is: + ['both houses of Congress'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:03:06,680 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:06,680 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:06,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:06,681 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:06,681 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:07,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,786 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.104665756225586 s; generated tokens: 6 tokens; generate speed: 5.43150719227575 tokens/s +2024-07-30 14:03:07,791 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:07,791 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[726/2067], cost time 1.1157s, every example cost time is 1.1157, generate speed: 5.3776 tokens/s, avg speed: 10.4126 tokens/s, remaining time: 0:30:38 +pred is: + ['Nitrogen/Oxygen'] + label is: + ['nitrogen/oxygen mixture'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:03:07,874 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:07,874 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:07,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:07,875 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:07,875 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:08,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:08,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:08,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:08,886 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0106682777404785 s; generated tokens: 3 tokens; generate speed: 2.968332999138958 tokens/s +2024-07-30 14:03:08,890 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:08,891 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[727/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9355 tokens/s, avg speed: 10.4049 tokens/s, remaining time: 0:30:36 +pred is: + ['J'] + label is: + ['sequence'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:08,973 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:08,973 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 353, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:08,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:08,974 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:08,974 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:09,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:09,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:09,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,517 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5431761741638184 s; generated tokens: 20 tokens; generate speed: 12.960283041459704 tokens/s +2024-07-30 14:03:10,522 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:10,522 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[728/2067], cost time 1.5546s, every example cost time is 1.5546, generate speed: 12.8653 tokens/s, avg speed: 10.4088 tokens/s, remaining time: 0:30:35 +pred is: + ['AS-501'] + label is: + ['AS-501'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:10,605 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:10,605 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:10,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:10,606 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:10,606 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:11,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:11,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:12,142 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5360424518585205 s; generated tokens: 20 tokens; generate speed: 13.02047347441549 tokens/s +2024-07-30 14:03:12,147 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:12,147 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[729/2067], cost time 1.5472s, every example cost time is 1.5472, generate speed: 12.9268 tokens/s, avg speed: 10.4127 tokens/s, remaining time: 0:30:34 +pred is: + ['Apollo 5'] + label is: + ['Apollo 5'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:12,230 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:12,230 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 277, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:12,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:12,231 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:12,231 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:13,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:13,769 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5379188060760498 s; generated tokens: 20 tokens; generate speed: 13.004587707090568 tokens/s +2024-07-30 14:03:13,774 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:13,774 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[730/2067], cost time 1.5494s, every example cost time is 1.5494, generate speed: 12.9081 tokens/s, avg speed: 10.4165 tokens/s, remaining time: 0:30:32 +pred is: + ['Saturn IB'] + label is: + ['two Saturn IBs'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 62.191002664647336, Em score: 49.58904109589041, current_count: 730 +2024-07-30 14:03:14,036 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:14,037 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:14,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:14,037 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:14,038 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:14,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,577 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5396034717559814 s; generated tokens: 20 tokens; generate speed: 12.990357820633628 tokens/s +2024-07-30 14:03:15,582 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:15,582 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[731/2067], cost time 1.5509s, every example cost time is 1.5509, generate speed: 12.8959 tokens/s, avg speed: 10.4204 tokens/s, remaining time: 0:30:31 +pred is: + ['1'] + label is: + ['Gemini'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:15,665 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:15,665 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:15,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:15,666 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:15,666 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:16,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:16,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:17,197 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310378074645996 s; generated tokens: 20 tokens; generate speed: 13.063034696132046 tokens/s +2024-07-30 14:03:17,202 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:17,202 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[732/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9687 tokens/s, avg speed: 10.4243 tokens/s, remaining time: 0:30:30 +pred is: + ['Apollo 12'] + label is: + ['Apollo 12'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:17,285 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:17,285 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:17,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:17,286 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:17,286 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:18,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,549 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2629194259643555 s; generated tokens: 11 tokens; generate speed: 8.709977670666111 tokens/s +2024-07-30 14:03:18,554 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:18,554 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[733/2067], cost time 1.2740s, every example cost time is 1.2740, generate speed: 8.6340 tokens/s, avg speed: 10.4220 tokens/s, remaining time: 0:30:29 +pred is: + ['The Lunar Roving Vehicle (LRV)'] + label is: + ['Lunar Roving Vehicle (LRV)'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +2024-07-30 14:03:18,637 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:18,637 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:18,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:18,637 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:18,638 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:19,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:19,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:20,182 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5439589023590088 s; generated tokens: 20 tokens; generate speed: 12.953712672948793 tokens/s +2024-07-30 14:03:20,187 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:20,187 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[734/2067], cost time 1.5551s, every example cost time is 1.5551, generate speed: 12.8605 tokens/s, avg speed: 10.4258 tokens/s, remaining time: 0:30:28 +pred is: + ['A liquid oxygen tank exploded, disabling the Service Module and forcing the crew to use the LM as'] + label is: + ['liquid oxygen tank exploded'] +The F1/Em of this example is: {'F1': 32.55813953488372, 'Em': 0.0} +2024-07-30 14:03:20,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:20,271 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:20,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:20,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:20,272 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:21,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,811 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5387763977050781 s; generated tokens: 20 tokens; generate speed: 12.99733998378704 tokens/s +2024-07-30 14:03:21,816 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:21,816 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[735/2067], cost time 1.5500s, every example cost time is 1.5500, generate speed: 12.9029 tokens/s, avg speed: 10.4296 tokens/s, remaining time: 0:30:27 +pred is: + ['Apollo 20'] + label is: + ['Apollo 20'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:21,898 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:21,898 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:21,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:21,899 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:21,899 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:22,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:22,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:22,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:22,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:22,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:22,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,432 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5329527854919434 s; generated tokens: 20 tokens; generate speed: 13.046716238936057 tokens/s +2024-07-30 14:03:23,437 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:23,437 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[736/2067], cost time 1.5441s, every example cost time is 1.5441, generate speed: 12.9522 tokens/s, avg speed: 10.4334 tokens/s, remaining time: 0:30:26 +pred is: + ['1'] + label is: + ['extremely old'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:23,519 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:23,520 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:23,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:23,520 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:23,520 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:24,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,776 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2550740242004395 s; generated tokens: 11 tokens; generate speed: 8.764423283326007 tokens/s +2024-07-30 14:03:24,780 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:24,781 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[737/2067], cost time 1.2663s, every example cost time is 1.2663, generate speed: 8.6865 tokens/s, avg speed: 10.4313 tokens/s, remaining time: 0:30:24 +pred is: + ['1'] + label is: + ['micrometeoroid impact craters'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:24,864 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:24,864 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:24,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:24,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:24,865 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:25,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:25,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:26,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:26,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1640522480010986 s; generated tokens: 8 tokens; generate speed: 6.872543748562435 tokens/s +2024-07-30 14:03:26,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:26,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[738/2067], cost time 1.1753s, every example cost time is 1.1753, generate speed: 6.8069 tokens/s, avg speed: 10.4270 tokens/s, remaining time: 0:30:22 +pred is: + ['170'] + label is: + ['$170 billion'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:03:26,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:26,116 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:26,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:26,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:26,117 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:27,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,664 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.54736328125 s; generated tokens: 20 tokens; generate speed: 12.925213000946671 tokens/s +2024-07-30 14:03:27,669 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:27,670 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[739/2067], cost time 1.5587s, every example cost time is 1.5587, generate speed: 12.8309 tokens/s, avg speed: 10.4307 tokens/s, remaining time: 0:30:21 +pred is: + ['Apollo Extension Series'] + label is: + ['Apollo X'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:03:27,752 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:27,752 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:27,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:27,753 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:27,753 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:28,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:28,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:28,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:28,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:28,794 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0402157306671143 s; generated tokens: 4 tokens; generate speed: 3.8453561910996172 tokens/s +2024-07-30 14:03:28,798 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:28,799 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[740/2067], cost time 1.0514s, every example cost time is 1.0514, generate speed: 3.8044 tokens/s, avg speed: 10.4239 tokens/s, remaining time: 0:30:19 +pred is: + ['1973'] + label is: + ['1973'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.04322984422626, Em score: 49.32432432432432, current_count: 740 +2024-07-30 14:03:29,064 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:29,065 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:29,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:29,065 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:29,065 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:30,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,602 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5361933708190918 s; generated tokens: 20 tokens; generate speed: 13.019194314929301 tokens/s +2024-07-30 14:03:30,607 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:30,607 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[741/2067], cost time 1.5475s, every example cost time is 1.5475, generate speed: 12.9241 tokens/s, avg speed: 10.4277 tokens/s, remaining time: 0:30:18 +pred is: + ['Lunar Reconnaissance Orbiter'] + label is: + ['Lunar Reconnaissance Orbiter'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:30,689 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:30,690 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:30,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:30,690 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:30,690 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:31,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,762 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0717568397521973 s; generated tokens: 5 tokens; generate speed: 4.665237313676541 tokens/s +2024-07-30 14:03:31,767 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:31,767 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[742/2067], cost time 1.0830s, every example cost time is 1.0830, generate speed: 4.6169 tokens/s, avg speed: 10.4215 tokens/s, remaining time: 0:30:16 +pred is: + ['Apollo 8'] + label is: + ['Apollo 8'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:31,849 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:31,849 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:31,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:31,850 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:31,850 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:32,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:32,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:33,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:33,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:33,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:33,383 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5327470302581787 s; generated tokens: 20 tokens; generate speed: 13.048467623930847 tokens/s +2024-07-30 14:03:33,388 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:33,388 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[743/2067], cost time 1.5440s, every example cost time is 1.5440, generate speed: 12.9538 tokens/s, avg speed: 10.4253 tokens/s, remaining time: 0:30:15 +pred is: + ['A special Apollo TV camera'] + label is: + ['special Apollo TV camera'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:03:33,471 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:33,471 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:33,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:33,472 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:33,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:34,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,757 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2850604057312012 s; generated tokens: 12 tokens; generate speed: 9.338082432920329 tokens/s +2024-07-30 14:03:34,762 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:34,763 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[744/2067], cost time 1.2965s, every example cost time is 1.2965, generate speed: 9.2555 tokens/s, avg speed: 10.4239 tokens/s, remaining time: 0:30:14 +pred is: + ['Nafzger'] + label is: + ['Nafzger'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:34,846 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:34,846 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:34,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:34,847 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:34,847 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:35,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:35,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:36,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:36,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:36,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:36,285 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4374868869781494 s; generated tokens: 17 tokens; generate speed: 11.826194836279164 tokens/s +2024-07-30 14:03:36,289 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:36,290 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[745/2067], cost time 1.4487s, every example cost time is 1.4487, generate speed: 11.7350 tokens/s, avg speed: 10.4257 tokens/s, remaining time: 0:30:13 +pred is: + ['primary law, secondary law, supplementary law'] + label is: + ['primary law, secondary law and supplementary law.'] +The F1/Em of this example is: {'F1': 57.14285714285715, 'Em': 0.0} +2024-07-30 14:03:36,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:36,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:36,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:36,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:36,374 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:37,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,782 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4077787399291992 s; generated tokens: 16 tokens; generate speed: 11.365422382216599 tokens/s +2024-07-30 14:03:37,787 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:37,787 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[746/2067], cost time 1.4191s, every example cost time is 1.4191, generate speed: 11.2746 tokens/s, avg speed: 10.4269 tokens/s, remaining time: 0:30:11 +pred is: + ['The courts of member states and the Court of Justice of the European Union'] + label is: + ['courts of member states and the Court of Justice of the European Union'] +The F1/Em of this example is: {'F1': 96.15384615384615, 'Em': 0.0} +2024-07-30 14:03:37,872 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:37,872 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:37,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:37,872 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:37,873 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:38,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:38,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:38,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:38,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:38,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:38,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,411 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.537618637084961 s; generated tokens: 20 tokens; generate speed: 13.007126421097679 tokens/s +2024-07-30 14:03:39,415 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:39,416 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[747/2067], cost time 1.5488s, every example cost time is 1.5488, generate speed: 12.9130 tokens/s, avg speed: 10.4306 tokens/s, remaining time: 0:30:10 +pred is: + ['The Treaty on European Union (TEU) and the Treaty on the Functioning of the European'] + label is: + ['Treaty on European Union (TEU) and the Treaty on the Functioning of the European Union (TFEU)'] +The F1/Em of this example is: {'F1': 87.87878787878788, 'Em': 0.0} +2024-07-30 14:03:39,500 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:39,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 410, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:39,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:39,501 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:39,501 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:40,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:40,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:41,044 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5433404445648193 s; generated tokens: 20 tokens; generate speed: 12.95890357207574 tokens/s +2024-07-30 14:03:41,049 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:41,049 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[748/2067], cost time 1.5548s, every example cost time is 1.5548, generate speed: 12.8635 tokens/s, avg speed: 10.4343 tokens/s, remaining time: 0:30:09 +pred is: + ['Treaty on the Functioning of the European Union (TFEU)'] + label is: + ['Treaty on European Union (TEU)'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:03:41,133 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:41,133 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 331, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:41,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:41,134 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:41,134 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:42,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,674 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5398859977722168 s; generated tokens: 20 tokens; generate speed: 12.98797445326108 tokens/s +2024-07-30 14:03:42,679 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:42,679 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[749/2067], cost time 1.5513s, every example cost time is 1.5513, generate speed: 12.8926 tokens/s, avg speed: 10.4380 tokens/s, remaining time: 0:30:08 +pred is: + ['1'] + label is: + ['with common rules for coal and steel, and then atomic energy'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:42,762 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:42,762 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:42,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:42,763 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:42,763 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:43,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:43,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:44,293 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529695987701416 s; generated tokens: 20 tokens; generate speed: 13.07449333775976 tokens/s +2024-07-30 14:03:44,298 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:44,298 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[750/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9772 tokens/s, avg speed: 10.4418 tokens/s, remaining time: 0:30:07 +pred is: + ['2004'] + label is: + ['Following the Nice Treaty'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.10755410120389, Em score: 49.06666666666667, current_count: 750 +2024-07-30 14:03:44,569 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:44,570 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 402, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:44,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:44,570 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:44,571 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:45,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,866 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2947778701782227 s; generated tokens: 12 tokens; generate speed: 9.26799899533982 tokens/s +2024-07-30 14:03:45,870 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:45,871 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[751/2067], cost time 1.3062s, every example cost time is 1.3062, generate speed: 9.1869 tokens/s, avg speed: 10.4403 tokens/s, remaining time: 0:30:06 +pred is: + ['The European Commission'] + label is: + ['The European Commission'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:45,953 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:45,953 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 325, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:45,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:45,954 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:45,954 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:46,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:46,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:46,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:46,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,184 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2294094562530518 s; generated tokens: 10 tokens; generate speed: 8.133986564962358 tokens/s +2024-07-30 14:03:47,189 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:47,189 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[752/2067], cost time 1.2406s, every example cost time is 1.2406, generate speed: 8.0605 tokens/s, avg speed: 10.4374 tokens/s, remaining time: 0:30:04 +pred is: + ['Santer Commission'] + label is: + ['the Santer Commission'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:03:47,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:47,272 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 656, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:47,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:47,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:47,273 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:48,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,821 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.548680067062378 s; generated tokens: 20 tokens; generate speed: 12.914223166788158 tokens/s +2024-07-30 14:03:48,826 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:48,827 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[753/2067], cost time 1.5600s, every example cost time is 1.5600, generate speed: 12.8202 tokens/s, avg speed: 10.4410 tokens/s, remaining time: 0:30:03 +pred is: + ['The European Parliament and the Council of the European Union'] + label is: + ['the European Parliament and the Council of the European Union'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:48,911 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:48,911 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 360, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:48,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:48,912 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:48,912 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:49,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:49,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:49,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:49,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:49,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,456 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5444576740264893 s; generated tokens: 20 tokens; generate speed: 12.949529363183427 tokens/s +2024-07-30 14:03:50,461 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:50,461 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[754/2067], cost time 1.5557s, every example cost time is 1.5557, generate speed: 12.8561 tokens/s, avg speed: 10.4446 tokens/s, remaining time: 0:30:02 +pred is: + ['1'] + label is: + ['different ministers of the member states'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:50,544 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:50,544 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 399, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:50,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:50,545 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:50,545 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:51,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:51,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:52,088 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5428295135498047 s; generated tokens: 20 tokens; generate speed: 12.9631951063622 tokens/s +2024-07-30 14:03:52,093 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:52,094 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[755/2067], cost time 1.5547s, every example cost time is 1.5547, generate speed: 12.8642 tokens/s, avg speed: 10.4482 tokens/s, remaining time: 0:30:01 +pred is: + ['majority of all MEPs'] + label is: + ['a majority'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:03:52,176 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:52,177 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 398, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:52,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:52,177 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:52,177 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:53,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,720 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5424723625183105 s; generated tokens: 20 tokens; generate speed: 12.966196663223897 tokens/s +2024-07-30 14:03:53,725 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:53,725 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[756/2067], cost time 1.5537s, every example cost time is 1.5537, generate speed: 12.8725 tokens/s, avg speed: 10.4519 tokens/s, remaining time: 0:30:00 +pred is: + ['1'] + label is: + ['judicial branch'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:03:53,807 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:53,807 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 634, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:53,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:53,808 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:53,808 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:54,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:54,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:55,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:55,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:55,230 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4217627048492432 s; generated tokens: 16 tokens; generate speed: 11.253636029014112 tokens/s +2024-07-30 14:03:55,235 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:55,235 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[757/2067], cost time 1.4330s, every example cost time is 1.4330, generate speed: 11.1656 tokens/s, avg speed: 10.4529 tokens/s, remaining time: 0:29:59 +pred is: + ['EU law takes precedence over national law.'] + label is: + ['EU law'] +The F1/Em of this example is: {'F1': 35.294117647058826, 'Em': 0.0} +2024-07-30 14:03:55,317 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:55,317 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 448, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:55,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:55,318 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:55,318 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:56,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,859 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5409605503082275 s; generated tokens: 20 tokens; generate speed: 12.978917595261956 tokens/s +2024-07-30 14:03:56,864 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:56,864 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[758/2067], cost time 1.5521s, every example cost time is 1.5521, generate speed: 12.8857 tokens/s, avg speed: 10.4565 tokens/s, remaining time: 0:29:58 +pred is: + ['EU law'] + label is: + ['EU law'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:56,946 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:56,946 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 333, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:56,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:56,947 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:56,947 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:57,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:57,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:57,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:57,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,492 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.545053482055664 s; generated tokens: 20 tokens; generate speed: 12.94453572790916 tokens/s +2024-07-30 14:03:58,497 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:03:58,498 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[759/2067], cost time 1.5563s, every example cost time is 1.5563, generate speed: 12.8510 tokens/s, avg speed: 10.4601 tokens/s, remaining time: 0:29:56 +pred is: + ['Administrative law'] + label is: + ['administrative law'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:03:58,580 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:03:58,580 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 521, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:03:58,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:58,581 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:03:58,581 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:03:59,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:03:59,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:00,136 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5545179843902588 s; generated tokens: 20 tokens; generate speed: 12.865724424439362 tokens/s +2024-07-30 14:04:00,141 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:00,141 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[760/2067], cost time 1.5659s, every example cost time is 1.5659, generate speed: 12.7725 tokens/s, avg speed: 10.4635 tokens/s, remaining time: 0:29:55 +pred is: + ['Van Gend en Loos v Nederlandse Administratie der Belastingen'] + label is: + ['Van Gend en Loos v Nederlandse Administratie der Belastingen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.11968380730261, Em score: 49.078947368421055, current_count: 760 +2024-07-30 14:04:00,451 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:00,452 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 285, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:00,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:00,452 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:00,452 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:01,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:01,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:02,025 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5721704959869385 s; generated tokens: 20 tokens; generate speed: 12.721266587212536 tokens/s +2024-07-30 14:04:02,030 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:02,030 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[761/2067], cost time 1.5841s, every example cost time is 1.5841, generate speed: 12.6252 tokens/s, avg speed: 10.4668 tokens/s, remaining time: 0:29:54 +pred is: + ['Directives do not generally give citizens (as opposed to the member state) standing to sue other'] + label is: + ['Directives'] +The F1/Em of this example is: {'F1': 5.882352941176471, 'Em': 0.0} +2024-07-30 14:04:02,115 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:02,115 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 567, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:02,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:02,116 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:02,116 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:03,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5624444484710693 s; generated tokens: 20 tokens; generate speed: 12.800455094304958 tokens/s +2024-07-30 14:04:03,684 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:03,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[762/2067], cost time 1.5741s, every example cost time is 1.5741, generate speed: 12.7053 tokens/s, avg speed: 10.4702 tokens/s, remaining time: 0:29:53 +pred is: + ['vertical direct effect'] + label is: + ['the member state cannot enforce conflicting laws, and a citizen may rely on the Directive in such an action'] +The F1/Em of this example is: {'F1': 4.651162790697675, 'Em': 0.0} +2024-07-30 14:04:03,768 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:03,769 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 358, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:03,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:03,769 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:03,770 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:04,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:04,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:05,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:05,329 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5591001510620117 s; generated tokens: 20 tokens; generate speed: 12.827912296959632 tokens/s +2024-07-30 14:04:05,334 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:05,334 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[763/2067], cost time 1.5709s, every example cost time is 1.5709, generate speed: 12.7315 tokens/s, avg speed: 10.4736 tokens/s, remaining time: 0:29:52 +pred is: + ['1'] + label is: + ['national courts'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:05,417 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:05,417 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:05,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:05,418 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:05,418 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:06,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:06,970 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5514116287231445 s; generated tokens: 20 tokens; generate speed: 12.891485167260583 tokens/s +2024-07-30 14:04:06,975 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:06,975 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[764/2067], cost time 1.5634s, every example cost time is 1.5634, generate speed: 12.7929 tokens/s, avg speed: 10.4770 tokens/s, remaining time: 0:29:51 +pred is: + ['European Court of Justice'] + label is: + ['the European Court of Justice'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:04:07,059 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:07,059 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:07,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:07,060 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:07,060 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:08,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,620 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.559581995010376 s; generated tokens: 20 tokens; generate speed: 12.823949022229472 tokens/s +2024-07-30 14:04:08,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:08,625 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[765/2067], cost time 1.5715s, every example cost time is 1.5715, generate speed: 12.7266 tokens/s, avg speed: 10.4804 tokens/s, remaining time: 0:29:50 +pred is: + ['Since the 1950s'] + label is: + ['since the 1950s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:08,707 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:08,708 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 295, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:08,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:08,708 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:08,708 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:09,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:09,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:10,250 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541250228881836 s; generated tokens: 20 tokens; generate speed: 12.976478202705495 tokens/s +2024-07-30 14:04:10,255 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:10,255 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[766/2067], cost time 1.5528s, every example cost time is 1.5528, generate speed: 12.8802 tokens/s, avg speed: 10.4839 tokens/s, remaining time: 0:29:49 +pred is: + ['Since the 1960s'] + label is: + ['since the 1960s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:10,337 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:10,338 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:10,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:10,338 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:10,339 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:11,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,899 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5601577758789062 s; generated tokens: 20 tokens; generate speed: 12.819216305692615 tokens/s +2024-07-30 14:04:11,904 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:11,904 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[767/2067], cost time 1.5716s, every example cost time is 1.5716, generate speed: 12.7262 tokens/s, avg speed: 10.4872 tokens/s, remaining time: 0:29:48 +pred is: + ['The European Court of Justice is likely to get inspiration from the constitutional traditions common to the member states'] + label is: + ['from the constitutional traditions common to the member states'] +The F1/Em of this example is: {'F1': 62.96296296296296, 'Em': 0.0} +2024-07-30 14:04:11,989 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:11,989 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:11,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:11,990 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:11,990 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:12,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:12,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:12,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,218 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2278385162353516 s; generated tokens: 10 tokens; generate speed: 8.144393475015573 tokens/s +2024-07-30 14:04:13,223 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:13,223 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[768/2067], cost time 1.2394s, every example cost time is 1.2394, generate speed: 8.0684 tokens/s, avg speed: 10.4844 tokens/s, remaining time: 0:29:47 +pred is: + ['0'] + label is: + ['None'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:13,306 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:13,307 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:13,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:13,307 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:13,308 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:14,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,779 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.471585750579834 s; generated tokens: 18 tokens; generate speed: 12.231703108641575 tokens/s +2024-07-30 14:04:14,784 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:14,784 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[769/2067], cost time 1.4833s, every example cost time is 1.4833, generate speed: 12.1353 tokens/s, avg speed: 10.4867 tokens/s, remaining time: 0:29:45 +pred is: + ['2007'] + label is: + ['2007'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:14,867 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:14,867 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:14,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:14,868 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:14,868 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:15,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:15,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:16,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.133385419845581 s; generated tokens: 7 tokens; generate speed: 6.176186738800399 tokens/s +2024-07-30 14:04:16,007 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:16,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[770/2067], cost time 1.1447s, every example cost time is 1.1447, generate speed: 6.1149 tokens/s, avg speed: 10.4820 tokens/s, remaining time: 0:29:44 +pred is: + ['Treaty of Amsterdam'] + label is: + ['1997 Treaty of Amsterdam'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +F1 score: 62.01985650075084, Em score: 48.83116883116883, current_count: 770 +2024-07-30 14:04:16,289 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:16,289 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:16,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:16,290 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:16,290 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:17,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,547 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2562851905822754 s; generated tokens: 11 tokens; generate speed: 8.75597362960365 tokens/s +2024-07-30 14:04:17,551 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:17,552 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[771/2067], cost time 1.2679s, every example cost time is 1.2679, generate speed: 8.6757 tokens/s, avg speed: 10.4798 tokens/s, remaining time: 0:29:42 +pred is: + ['11'] + label is: + ['11 of the then 12 member states'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:04:17,634 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:17,634 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:17,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:17,635 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:17,635 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:18,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:18,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:19,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307817459106445 s; generated tokens: 20 tokens; generate speed: 13.065219815580065 tokens/s +2024-07-30 14:04:19,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:19,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[772/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9696 tokens/s, avg speed: 10.4834 tokens/s, remaining time: 0:29:41 +pred is: + ['The election of the UK Labour Party to government in 1997'] + label is: + ['the election of the UK Labour Party to government'] +The F1/Em of this example is: {'F1': 89.47368421052632, 'Em': 0.0} +2024-07-30 14:04:19,255 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:19,255 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 345, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:19,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:19,256 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:19,256 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:20,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,821 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.565004825592041 s; generated tokens: 20 tokens; generate speed: 12.779513310723502 tokens/s +2024-07-30 14:04:20,826 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:20,827 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[773/2067], cost time 1.5764s, every example cost time is 1.5764, generate speed: 12.6871 tokens/s, avg speed: 10.4867 tokens/s, remaining time: 0:29:40 +pred is: + ['France, Italy, Belgium, the Netherlands, Luxembourg and Germany'] + label is: + ['France, Italy, Belgium, the Netherlands, Luxembourg and Germany'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:20,910 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:20,910 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 311, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:20,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:20,911 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:20,911 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:21,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:21,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:21,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:21,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:21,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,447 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536198616027832 s; generated tokens: 20 tokens; generate speed: 13.019149862088959 tokens/s +2024-07-30 14:04:22,452 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:22,452 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[774/2067], cost time 1.5475s, every example cost time is 1.5475, generate speed: 12.9244 tokens/s, avg speed: 10.4903 tokens/s, remaining time: 0:29:39 +pred is: + ['101'] + label is: + ['Article 101(1)'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:04:22,565 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:22,565 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 495, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:22,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:22,566 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:22,566 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:23,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,805 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2391021251678467 s; generated tokens: 10 tokens; generate speed: 8.070359816908084 tokens/s +2024-07-30 14:04:23,810 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:23,811 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[775/2067], cost time 1.2508s, every example cost time is 1.2508, generate speed: 7.9947 tokens/s, avg speed: 10.4873 tokens/s, remaining time: 0:29:37 +pred is: + ['2007'] + label is: + ['2007'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:23,893 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:23,893 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 665, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:23,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:23,894 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:23,894 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:24,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:24,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:24,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:24,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:24,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:25,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:25,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:25,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:25,068 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1737241744995117 s; generated tokens: 8 tokens; generate speed: 6.815911415824151 tokens/s +2024-07-30 14:04:25,073 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:25,073 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[776/2067], cost time 1.1854s, every example cost time is 1.1854, generate speed: 6.7488 tokens/s, avg speed: 10.4832 tokens/s, remaining time: 0:29:35 +pred is: + ['The principle of non-discrimination'] + label is: + ['a customs union, and the principle of non-discrimination'] +The F1/Em of this example is: {'F1': 60.86956521739131, 'Em': 0.0} +2024-07-30 14:04:25,157 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:25,157 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 684, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:25,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:25,158 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:25,158 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:26,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,362 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.203796148300171 s; generated tokens: 9 tokens; generate speed: 7.4763488923839105 tokens/s +2024-07-30 14:04:26,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:26,367 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[777/2067], cost time 1.2153s, every example cost time is 1.2153, generate speed: 7.4056 tokens/s, avg speed: 10.4797 tokens/s, remaining time: 0:29:34 +pred is: + ['25'] + label is: + ['25'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:26,450 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:26,450 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 538, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:26,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:26,451 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:26,451 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:27,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:27,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:28,001 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5500173568725586 s; generated tokens: 20 tokens; generate speed: 12.903081317975452 tokens/s +2024-07-30 14:04:28,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:28,006 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[778/2067], cost time 1.5614s, every example cost time is 1.5614, generate speed: 12.8087 tokens/s, avg speed: 10.4831 tokens/s, remaining time: 0:29:33 +pred is: + ['Keck and Mithouard'] + label is: + ['Keck and Mithouard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:28,088 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:28,089 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 483, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:28,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:28,089 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:28,089 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:29,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.577451229095459 s; generated tokens: 20 tokens; generate speed: 12.678680412495787 tokens/s +2024-07-30 14:04:29,672 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:29,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[779/2067], cost time 1.5886s, every example cost time is 1.5886, generate speed: 12.5897 tokens/s, avg speed: 10.4862 tokens/s, remaining time: 0:29:32 +pred is: + ['People to pursue their life goals in any country through free movement'] + label is: + ['to enable people to pursue their life goals in any country through free movement'] +The F1/Em of this example is: {'F1': 92.0, 'Em': 0.0} +2024-07-30 14:04:29,756 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:29,756 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 747, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:29,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:29,757 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:29,757 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:30,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:30,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:31,315 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5576694011688232 s; generated tokens: 20 tokens; generate speed: 12.839694985978838 tokens/s +2024-07-30 14:04:31,320 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:31,320 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[780/2067], cost time 1.5690s, every example cost time is 1.5690, generate speed: 12.7473 tokens/s, avg speed: 10.4895 tokens/s, remaining time: 0:29:31 +pred is: + ['1 to 4'] + label is: + ['articles 1 to 7'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +F1 score: 62.18866226221779, Em score: 48.717948717948715, current_count: 780 +2024-07-30 14:04:31,607 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:31,608 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:31,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:31,608 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:31,609 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:32,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:32,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:33,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5572819709777832 s; generated tokens: 20 tokens; generate speed: 12.842889324302933 tokens/s +2024-07-30 14:04:33,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:33,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[781/2067], cost time 1.5687s, every example cost time is 1.5687, generate speed: 12.7494 tokens/s, avg speed: 10.4928 tokens/s, remaining time: 0:29:30 +pred is: + ['Citizenship of the EU'] + label is: + ['Citizenship of the EU'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:33,253 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:33,254 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 494, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:33,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:33,254 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:33,254 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:34,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,803 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5483918190002441 s; generated tokens: 20 tokens; generate speed: 12.916627273911505 tokens/s +2024-07-30 14:04:34,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:34,808 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[782/2067], cost time 1.5595s, every example cost time is 1.5595, generate speed: 12.8243 tokens/s, avg speed: 10.4962 tokens/s, remaining time: 0:29:29 +pred is: + ['Treaty on the Functioning of the European Union'] + label is: + ['the Treaty on the Functioning of the European Union'] +The F1/Em of this example is: {'F1': 93.75, 'Em': 0.0} +2024-07-30 14:04:34,890 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:34,891 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 295, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:34,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:34,891 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:34,892 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:35,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:35,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:35,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:35,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:35,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:35,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,431 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390710830688477 s; generated tokens: 20 tokens; generate speed: 12.994851387968891 tokens/s +2024-07-30 14:04:36,436 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:36,436 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[783/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9009 tokens/s, avg speed: 10.4996 tokens/s, remaining time: 0:29:27 +pred is: + ['2006'] + label is: + ['2006'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:36,518 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:36,518 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 834, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:36,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:36,519 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:36,519 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:37,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:37,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:38,080 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5604276657104492 s; generated tokens: 20 tokens; generate speed: 12.816999108314434 tokens/s +2024-07-30 14:04:38,084 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:38,085 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[784/2067], cost time 1.5717s, every example cost time is 1.5717, generate speed: 12.7253 tokens/s, avg speed: 10.5029 tokens/s, remaining time: 0:29:26 +pred is: + ['1'] + label is: + ['to people who give services "for remuneration"'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:38,167 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:38,167 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 587, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:38,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:38,168 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:38,168 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:39,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,728 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5592882633209229 s; generated tokens: 20 tokens; generate speed: 12.82636473990039 tokens/s +2024-07-30 14:04:39,733 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:39,733 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[785/2067], cost time 1.5706s, every example cost time is 1.5706, generate speed: 12.7339 tokens/s, avg speed: 10.5061 tokens/s, remaining time: 0:29:25 +pred is: + ['1'] + label is: + ['the Daily Mail'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:39,815 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:39,815 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 302, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:39,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:39,816 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:39,816 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:40,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:40,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:41,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:41,015 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1991255283355713 s; generated tokens: 9 tokens; generate speed: 7.505469433623283 tokens/s +2024-07-30 14:04:41,020 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:41,020 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[786/2067], cost time 1.2103s, every example cost time is 1.2103, generate speed: 7.4362 tokens/s, avg speed: 10.5027 tokens/s, remaining time: 0:29:24 +pred is: + ['Amazonia'] + label is: + ['also known in English as Amazonia or the Amazon Jungle,'] +The F1/Em of this example is: {'F1': 9.523809523809524, 'Em': 0.0} +2024-07-30 14:04:41,114 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:41,114 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:41,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:41,115 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:41,115 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:42,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,589 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4739434719085693 s; generated tokens: 18 tokens; generate speed: 12.212137265136965 tokens/s +2024-07-30 14:04:42,594 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:42,594 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[787/2067], cost time 1.4855s, every example cost time is 1.4855, generate speed: 12.1175 tokens/s, avg speed: 10.5049 tokens/s, remaining time: 0:29:23 +pred is: + ['1'] + label is: + ['the wetter climate may have allowed the tropical rainforest to spread out across the continent.'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:42,677 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:42,677 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:42,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:42,678 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:42,678 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:43,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:43,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:44,209 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5304183959960938 s; generated tokens: 20 tokens; generate speed: 13.068321742815124 tokens/s +2024-07-30 14:04:44,214 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:44,214 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[788/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9740 tokens/s, avg speed: 10.5084 tokens/s, remaining time: 0:29:21 +pred is: + ['1'] + label is: + ['During the mid-Eocene, it is believed that the drainage basin of the Amazon was split along the middle of the continent by the Purus Arch.'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:44,297 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:44,298 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:44,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:44,298 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:44,298 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:45,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,650 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3514060974121094 s; generated tokens: 14 tokens; generate speed: 10.35958031180225 tokens/s +2024-07-30 14:04:45,655 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:45,655 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[789/2067], cost time 1.3625s, every example cost time is 1.3625, generate speed: 10.2752 tokens/s, avg speed: 10.5081 tokens/s, remaining time: 0:29:20 +pred is: + ['Last Glacial Maximum'] + label is: + ['Last Glacial Maximum'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:45,738 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:45,738 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:45,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:45,738 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:45,739 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:46,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:46,933 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1941664218902588 s; generated tokens: 9 tokens; generate speed: 7.536637971911657 tokens/s +2024-07-30 14:04:46,938 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:46,938 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[790/2067], cost time 1.2052s, every example cost time is 1.2052, generate speed: 7.4674 tokens/s, avg speed: 10.5047 tokens/s, remaining time: 0:29:18 +pred is: + ['CALIPSO'] + label is: + ['CALIPSO'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.03851946082745, Em score: 48.607594936708864, current_count: 790 +2024-07-30 14:04:47,234 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:47,235 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:47,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:47,235 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:47,236 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:48,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,558 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3222970962524414 s; generated tokens: 13 tokens; generate speed: 9.831376047670117 tokens/s +2024-07-30 14:04:48,563 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:48,563 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[791/2067], cost time 1.3339s, every example cost time is 1.3339, generate speed: 9.7460 tokens/s, avg speed: 10.5038 tokens/s, remaining time: 0:29:17 +pred is: + ['Amazonia: Man and Culture in a Counterfeit Paradise'] + label is: + ['Man and Culture in a Counterfeit Paradise'] +The F1/Em of this example is: {'F1': 92.85714285714286, 'Em': 0.0} +2024-07-30 14:04:48,646 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:48,646 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 259, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:48,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:48,647 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:48,647 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:49,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,822 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1746373176574707 s; generated tokens: 8 tokens; generate speed: 6.810612841718719 tokens/s +2024-07-30 14:04:49,827 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:49,827 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[792/2067], cost time 1.1858s, every example cost time is 1.1858, generate speed: 6.7468 tokens/s, avg speed: 10.4997 tokens/s, remaining time: 0:29:15 +pred is: + ['Francisco de Orellana'] + label is: + ['Francisco de Orellana'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:49,909 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:49,910 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:49,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:49,910 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:49,910 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:50,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:50,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:50,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:50,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:50,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,354 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4433064460754395 s; generated tokens: 17 tokens; generate speed: 11.77851041005566 tokens/s +2024-07-30 14:04:51,359 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:51,359 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[793/2067], cost time 1.4545s, every example cost time is 1.4545, generate speed: 11.6877 tokens/s, avg speed: 10.5013 tokens/s, remaining time: 0:29:14 +pred is: + ['Black earth'] + label is: + ['black earth'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:51,442 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:51,442 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:51,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:51,443 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:51,443 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:52,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:52,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:52,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:52,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:52,484 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.04020094871521 s; generated tokens: 4 tokens; generate speed: 3.8454108361855903 tokens/s +2024-07-30 14:04:52,488 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:52,489 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[794/2067], cost time 1.0526s, every example cost time is 1.0526, generate speed: 3.7999 tokens/s, avg speed: 10.4949 tokens/s, remaining time: 0:29:12 +pred is: + ['250000'] + label is: + ['2.5 million'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:52,570 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:52,570 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:52,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:52,571 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:52,571 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:53,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,736 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1644623279571533 s; generated tokens: 8 tokens; generate speed: 6.870123496424834 tokens/s +2024-07-30 14:04:53,741 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:53,741 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[795/2067], cost time 1.1755s, every example cost time is 1.1755, generate speed: 6.8055 tokens/s, avg speed: 10.4909 tokens/s, remaining time: 0:29:10 +pred is: + ['62'] + label is: + ['62 acres'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:04:53,822 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:53,823 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:53,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:53,823 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:53,824 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:54,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,894 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0704748630523682 s; generated tokens: 5 tokens; generate speed: 4.670824297305707 tokens/s +2024-07-30 14:04:54,899 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:54,899 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[796/2067], cost time 1.0816s, every example cost time is 1.0816, generate speed: 4.6228 tokens/s, avg speed: 10.4851 tokens/s, remaining time: 0:29:09 +pred is: + ['electric eel'] + label is: + ['electric eels'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:04:54,981 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:54,981 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:54,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:54,982 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:54,982 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:55,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:55,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:55,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:56,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:56,022 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.039597511291504 s; generated tokens: 4 tokens; generate speed: 3.8476429161808534 tokens/s +2024-07-30 14:04:56,027 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:56,027 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[797/2067], cost time 1.0506s, every example cost time is 1.0506, generate speed: 3.8072 tokens/s, avg speed: 10.4787 tokens/s, remaining time: 0:29:07 +pred is: + ['Deforestation'] + label is: + ['Deforestation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:04:56,108 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:56,109 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:56,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:56,109 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:56,110 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:57,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2601001262664795 s; generated tokens: 11 tokens; generate speed: 8.72946504068025 tokens/s +2024-07-30 14:04:57,375 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:57,375 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[798/2067], cost time 1.2711s, every example cost time is 1.2711, generate speed: 8.6536 tokens/s, avg speed: 10.4766 tokens/s, remaining time: 0:29:05 +pred is: + ['415000'] + label is: + ['415,000'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:57,457 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:57,457 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:57,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:57,458 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:57,458 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:04:58,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:58,990 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5322911739349365 s; generated tokens: 20 tokens; generate speed: 13.052349540485725 tokens/s +2024-07-30 14:04:58,995 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:04:58,996 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[799/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9571 tokens/s, avg speed: 10.4801 tokens/s, remaining time: 0:29:04 +pred is: + ['1'] + label is: + ['soy farmers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:04:59,077 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:04:59,078 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:04:59,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:04:59,078 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:04:59,078 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:00,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,625 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.546811819076538 s; generated tokens: 20 tokens; generate speed: 12.929821037920565 tokens/s +2024-07-30 14:05:00,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:00,631 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[800/2067], cost time 1.5581s, every example cost time is 1.5581, generate speed: 12.8363 tokens/s, avg speed: 10.4834 tokens/s, remaining time: 0:29:03 +pred is: + ['1'] + label is: + ['loss of biodiversity'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 61.899942729471874, Em score: 48.375, current_count: 800 +2024-07-30 14:05:00,925 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:00,925 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:00,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:00,926 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:00,926 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:01,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:01,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:01,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:01,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:01,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:02,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:02,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:02,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:02,094 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1676287651062012 s; generated tokens: 8 tokens; generate speed: 6.8514927338847835 tokens/s +2024-07-30 14:05:02,099 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:02,099 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[801/2067], cost time 1.1790s, every example cost time is 1.1790, generate speed: 6.7856 tokens/s, avg speed: 10.4794 tokens/s, remaining time: 0:29:01 +pred is: + ['Reduced rainfall and increased temperatures'] + label is: + ['reduced rainfall and increased temperatures'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:02,182 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:02,182 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:02,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:02,183 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:02,183 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:03,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,716 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5326967239379883 s; generated tokens: 20 tokens; generate speed: 13.048895901997886 tokens/s +2024-07-30 14:05:03,721 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:03,721 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[802/2067], cost time 1.5440s, every example cost time is 1.5440, generate speed: 12.9534 tokens/s, avg speed: 10.4829 tokens/s, remaining time: 0:29:00 +pred is: + ['Indigenous territories'] + label is: + ['indigenous territories'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:03,803 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:03,803 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:03,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:03,804 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:03,804 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:04,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:04,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:05,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:05,334 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528984785079956 s; generated tokens: 20 tokens; generate speed: 13.080574898561943 tokens/s +2024-07-30 14:05:05,338 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:05,339 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[803/2067], cost time 1.5402s, every example cost time is 1.5402, generate speed: 12.9853 tokens/s, avg speed: 10.4864 tokens/s, remaining time: 0:28:59 +pred is: + ['1'] + label is: + ['remote sensing'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:05,422 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:05,422 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:05,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:05,423 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:05,423 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:06,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:06,958 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535322666168213 s; generated tokens: 20 tokens; generate speed: 13.026577696475409 tokens/s +2024-07-30 14:05:06,963 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:06,963 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[804/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9319 tokens/s, avg speed: 10.4898 tokens/s, remaining time: 0:28:58 +pred is: + ['1'] + label is: + ['tree growth'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:07,046 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:07,046 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:07,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:07,047 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:07,047 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:07,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,305 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2569494247436523 s; generated tokens: 11 tokens; generate speed: 8.751346540648115 tokens/s +2024-07-30 14:05:08,309 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:08,309 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[805/2067], cost time 1.2680s, every example cost time is 1.2680, generate speed: 8.6749 tokens/s, avg speed: 10.4877 tokens/s, remaining time: 0:28:56 +pred is: + ['2005'] + label is: + ['2005'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:08,391 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:08,391 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:08,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:08,392 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:08,392 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:09,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,670 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2773706912994385 s; generated tokens: 11 tokens; generate speed: 8.611439165564356 tokens/s +2024-07-30 14:05:09,674 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:09,675 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[806/2067], cost time 1.2885s, every example cost time is 1.2885, generate speed: 8.5371 tokens/s, avg speed: 10.4855 tokens/s, remaining time: 0:28:55 +pred is: + ['2010'] + label is: + ['2010'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:09,757 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:09,758 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 319, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:09,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:09,758 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:09,758 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:10,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:10,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:11,296 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5373609066009521 s; generated tokens: 20 tokens; generate speed: 13.009306997547672 tokens/s +2024-07-30 14:05:11,301 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:11,301 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[807/2067], cost time 1.5488s, every example cost time is 1.5488, generate speed: 12.9134 tokens/s, avg speed: 10.4889 tokens/s, remaining time: 0:28:54 +pred is: + ['comb jellies'] + label is: + ['comb jellies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:11,384 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:11,384 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:11,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:11,385 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:11,385 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:12,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:12,921 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536360263824463 s; generated tokens: 20 tokens; generate speed: 13.017780055189649 tokens/s +2024-07-30 14:05:12,926 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:12,926 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[808/2067], cost time 1.5475s, every example cost time is 1.5475, generate speed: 12.9243 tokens/s, avg speed: 10.4922 tokens/s, remaining time: 0:28:53 +pred is: + ['10 times their own weight'] + label is: + ['ten times their own weight'] +The F1/Em of this example is: {'F1': 88.88888888888889, 'Em': 0.0} +2024-07-30 14:05:13,009 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:13,010 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 287, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:13,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:13,010 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:13,010 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:13,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:13,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,115 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1045687198638916 s; generated tokens: 6 tokens; generate speed: 5.431984350180891 tokens/s +2024-07-30 14:05:14,120 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:14,120 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[809/2067], cost time 1.1157s, every example cost time is 1.1157, generate speed: 5.3780 tokens/s, avg speed: 10.4871 tokens/s, remaining time: 0:28:51 +pred is: + ['Hermaprodites'] + label is: + ['Most species are hermaphrodites'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:14,203 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:14,203 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:14,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:14,204 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:14,204 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:15,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:15,741 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5371639728546143 s; generated tokens: 20 tokens; generate speed: 13.010973684777877 tokens/s +2024-07-30 14:05:15,746 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:15,746 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[810/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9161 tokens/s, avg speed: 10.4905 tokens/s, remaining time: 0:28:50 +pred is: + ['Black Sea'] + label is: + ['the Black Sea'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 61.955361817859746, Em score: 48.39506172839506, current_count: 810 +2024-07-30 14:05:16,044 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:16,044 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 280, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:16,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:16,045 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:16,045 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:16,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,579 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342519283294678 s; generated tokens: 20 tokens; generate speed: 13.035668804259874 tokens/s +2024-07-30 14:05:17,584 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:17,584 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[811/2067], cost time 1.5458s, every example cost time is 1.5458, generate speed: 12.9384 tokens/s, avg speed: 10.4939 tokens/s, remaining time: 0:28:49 +pred is: + ['66 million years ago'] + label is: + ['66 million years ago'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:17,673 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:17,674 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:17,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:17,674 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:17,675 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:18,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:18,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:18,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:18,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:18,715 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.040464162826538 s; generated tokens: 4 tokens; generate speed: 3.8444380334384123 tokens/s +2024-07-30 14:05:18,720 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:18,720 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[812/2067], cost time 1.0518s, every example cost time is 1.0518, generate speed: 3.8029 tokens/s, avg speed: 10.4876 tokens/s, remaining time: 0:28:47 +pred is: + ['Cnidarians'] + label is: + ['cnidarians'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:18,802 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:18,802 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:18,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:18,803 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:18,803 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:19,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:19,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:19,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:19,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:19,844 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0411112308502197 s; generated tokens: 4 tokens; generate speed: 3.84204865097211 tokens/s +2024-07-30 14:05:19,849 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:19,849 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[813/2067], cost time 1.0522s, every example cost time is 1.0522, generate speed: 3.8016 tokens/s, avg speed: 10.4813 tokens/s, remaining time: 0:28:45 +pred is: + ['mesoglea'] + label is: + ['mesoglea'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:19,931 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:19,932 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:19,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:19,932 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:19,933 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:20,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:20,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:20,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:20,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,438 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.505523681640625 s; generated tokens: 19 tokens; generate speed: 12.620193379684999 tokens/s +2024-07-30 14:05:21,443 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:21,443 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[814/2067], cost time 1.5168s, every example cost time is 1.5168, generate speed: 12.5261 tokens/s, avg speed: 10.4841 tokens/s, remaining time: 0:28:44 +pred is: + ['cilia'] + label is: + ['cilia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:21,526 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:21,526 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:21,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:21,527 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:21,527 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:22,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,692 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1654002666473389 s; generated tokens: 8 tokens; generate speed: 6.864594276277848 tokens/s +2024-07-30 14:05:22,697 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:22,697 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[815/2067], cost time 1.1766s, every example cost time is 1.1766, generate speed: 6.7993 tokens/s, avg speed: 10.4802 tokens/s, remaining time: 0:28:42 +pred is: + ['Pleurobrachia'] + label is: + ['Pleurobrachia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:22,780 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:22,780 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 314, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:22,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:22,781 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:22,781 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:23,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,888 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.106966495513916 s; generated tokens: 6 tokens; generate speed: 5.420218248985452 tokens/s +2024-07-30 14:05:23,893 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:23,893 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[816/2067], cost time 1.1181s, every example cost time is 1.1181, generate speed: 5.3663 tokens/s, avg speed: 10.4751 tokens/s, remaining time: 0:28:40 +pred is: + ['a pharynx'] + label is: + ['epithelium'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:23,980 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:23,980 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 314, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:23,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:23,981 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:23,981 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:24,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:24,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:24,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,240 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.259014368057251 s; generated tokens: 11 tokens; generate speed: 8.736993221907216 tokens/s +2024-07-30 14:05:25,245 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:25,245 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[817/2067], cost time 1.2705s, every example cost time is 1.2705, generate speed: 8.6580 tokens/s, avg speed: 10.4730 tokens/s, remaining time: 0:28:39 +pred is: + ['swimming-plates'] + label is: + ['swimming-plates'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:25,327 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:25,327 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:25,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:25,328 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:25,328 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:26,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,554 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2260189056396484 s; generated tokens: 10 tokens; generate speed: 8.156481073823834 tokens/s +2024-07-30 14:05:26,559 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:26,559 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[818/2067], cost time 1.2371s, every example cost time is 1.2371, generate speed: 8.0836 tokens/s, avg speed: 10.4704 tokens/s, remaining time: 0:28:37 +pred is: + ['By pumping water into the mesoglea'] + label is: + ['osmotic pressure'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:05:26,643 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:26,643 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:26,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:26,644 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:26,644 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:27,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,747 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.10319185256958 s; generated tokens: 6 tokens; generate speed: 5.438763879577846 tokens/s +2024-07-30 14:05:27,752 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:27,752 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[819/2067], cost time 1.1145s, every example cost time is 1.1145, generate speed: 5.3837 tokens/s, avg speed: 10.4654 tokens/s, remaining time: 0:28:35 +pred is: + ['The aboral organ'] + label is: + ['aboral organ'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:05:27,834 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:27,834 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:27,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:27,835 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:27,835 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:28,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:28,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:28,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:28,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:28,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:28,905 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0701608657836914 s; generated tokens: 5 tokens; generate speed: 4.672194769838122 tokens/s +2024-07-30 14:05:28,910 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:28,910 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[820/2067], cost time 1.0812s, every example cost time is 1.0812, generate speed: 4.6244 tokens/s, avg speed: 10.4598 tokens/s, remaining time: 0:28:33 +pred is: + ['Sea Gooseberry'] + label is: + ['sea gooseberry'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.16235217896599, Em score: 48.65853658536585, current_count: 820 +2024-07-30 14:05:29,224 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:29,224 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 486, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:29,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:29,225 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:29,226 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:30,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,771 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5454628467559814 s; generated tokens: 20 tokens; generate speed: 12.941106958333673 tokens/s +2024-07-30 14:05:30,776 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:30,776 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[821/2067], cost time 1.5596s, every example cost time is 1.5596, generate speed: 12.8239 tokens/s, avg speed: 10.4630 tokens/s, remaining time: 0:28:32 +pred is: + ['tentilla'] + label is: + ['tentilla'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:30,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:30,860 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:30,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:30,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:30,861 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:31,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:31,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:31,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:31,872 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0107669830322266 s; generated tokens: 3 tokens; generate speed: 2.9680431299805825 tokens/s +2024-07-30 14:05:31,876 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:31,877 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[822/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9354 tokens/s, avg speed: 10.4562 tokens/s, remaining time: 0:28:30 +pred is: + ['8'] + label is: + ['eight rows'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:31,959 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:31,959 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:31,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:31,960 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:31,960 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:32,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:32,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:32,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:32,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,496 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5356953144073486 s; generated tokens: 20 tokens; generate speed: 13.023416697548722 tokens/s +2024-07-30 14:05:33,501 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:33,501 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[823/2067], cost time 1.5470s, every example cost time is 1.5470, generate speed: 12.9284 tokens/s, avg speed: 10.4596 tokens/s, remaining time: 0:28:29 +pred is: + ['1'] + label is: + ['lobes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:33,584 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:33,584 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:33,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:33,585 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:33,585 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:34,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:34,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:35,121 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536005973815918 s; generated tokens: 20 tokens; generate speed: 13.02078269286529 tokens/s +2024-07-30 14:05:35,126 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:35,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[824/2067], cost time 1.5472s, every example cost time is 1.5472, generate speed: 12.9269 tokens/s, avg speed: 10.4630 tokens/s, remaining time: 0:28:28 +pred is: + ['1'] + label is: + ['by clapping their lobes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:35,210 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:35,210 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:35,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:35,211 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:35,211 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:36,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,745 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.533358097076416 s; generated tokens: 20 tokens; generate speed: 13.043267608612162 tokens/s +2024-07-30 14:05:36,750 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:36,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[825/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9362 tokens/s, avg speed: 10.4664 tokens/s, remaining time: 0:28:27 +pred is: + ['Nuda'] + label is: + ['Nuda'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:36,832 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:36,832 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:36,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:36,833 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:36,833 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:37,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:37,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:38,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:38,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:38,154 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3214046955108643 s; generated tokens: 13 tokens; generate speed: 9.838015593681623 tokens/s +2024-07-30 14:05:38,160 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:38,160 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[826/2067], cost time 1.3329s, every example cost time is 1.3329, generate speed: 9.7533 tokens/s, avg speed: 10.4655 tokens/s, remaining time: 0:28:26 +pred is: + ['Cestum veneris'] + label is: + ['The Cestida'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:05:38,242 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:38,243 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:38,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:38,243 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:38,243 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:39,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,785 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541213035583496 s; generated tokens: 20 tokens; generate speed: 12.976791357353198 tokens/s +2024-07-30 14:05:39,790 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:39,790 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[827/2067], cost time 1.5526s, every example cost time is 1.5526, generate speed: 12.8820 tokens/s, avg speed: 10.4688 tokens/s, remaining time: 0:28:25 +pred is: + ['A pair of tentilla-bearing tentacles'] + label is: + ['a pair of tentilla-bearing tentacles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:39,873 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:39,873 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:39,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:39,874 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:39,874 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:40,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:40,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:40,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:40,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:40,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:40,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,192 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3180880546569824 s; generated tokens: 13 tokens; generate speed: 9.862770513752288 tokens/s +2024-07-30 14:05:41,197 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:41,197 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[828/2067], cost time 1.3292s, every example cost time is 1.3292, generate speed: 9.7805 tokens/s, avg speed: 10.4680 tokens/s, remaining time: 0:28:23 +pred is: + ['via pores in the epidermis'] + label is: + ['via pores in the epidermis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:41,280 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:41,280 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:41,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:41,281 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:41,281 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:42,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:42,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:42,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:42,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:42,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0405380725860596 s; generated tokens: 4 tokens; generate speed: 3.8441649617478775 tokens/s +2024-07-30 14:05:42,326 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:42,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[829/2067], cost time 1.0520s, every example cost time is 1.0520, generate speed: 3.8023 tokens/s, avg speed: 10.4619 tokens/s, remaining time: 0:28:21 +pred is: + ['tentacles'] + label is: + ['tentacles and tentacle sheaths'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:05:42,409 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:42,409 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:42,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:42,410 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:42,410 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:43,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:43,947 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5363092422485352 s; generated tokens: 20 tokens; generate speed: 13.018212381986384 tokens/s +2024-07-30 14:05:43,952 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:43,952 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[830/2067], cost time 1.5478s, every example cost time is 1.5478, generate speed: 12.9217 tokens/s, avg speed: 10.4652 tokens/s, remaining time: 0:28:20 +pred is: + ['They produce secretions (ink) that luminesce at much the same wavelengths as their bodies'] + label is: + ['they produce secretions (ink) that luminesce'] +The F1/Em of this example is: {'F1': 61.904761904761905, 'Em': 0.0} +F1 score: 62.04020106263879, Em score: 48.55421686746988, current_count: 830 +2024-07-30 14:05:44,255 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:44,255 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 426, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:44,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:44,256 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:44,256 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:45,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:45,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:45,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:45,270 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0136826038360596 s; generated tokens: 3 tokens; generate speed: 2.959506248452087 tokens/s +2024-07-30 14:05:45,275 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:45,275 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[831/2067], cost time 1.0251s, every example cost time is 1.0251, generate speed: 2.9265 tokens/s, avg speed: 10.4584 tokens/s, remaining time: 0:28:18 +pred is: + ['Predators'] + label is: + ['Almost all ctenophores are predators'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:05:45,357 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:45,357 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:45,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:45,358 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:45,358 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:46,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,892 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338828563690186 s; generated tokens: 20 tokens; generate speed: 13.038805353978374 tokens/s +2024-07-30 14:05:46,897 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:46,898 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[832/2067], cost time 1.5453s, every example cost time is 1.5453, generate speed: 12.9428 tokens/s, avg speed: 10.4618 tokens/s, remaining time: 0:28:17 +pred is: + ['It was thought that ctenophores were a poor diet for other animals because of their low'] + label is: + ['their low ratio of organic matter to salt and water'] +The F1/Em of this example is: {'F1': 12.000000000000002, 'Em': 0.0} +2024-07-30 14:05:46,981 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:46,982 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 318, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:46,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:46,982 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:46,982 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:47,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:47,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:47,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,520 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5371417999267578 s; generated tokens: 20 tokens; generate speed: 13.011161365173315 tokens/s +2024-07-30 14:05:48,525 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:48,525 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[833/2067], cost time 1.5488s, every example cost time is 1.5488, generate speed: 12.9128 tokens/s, avg speed: 10.4651 tokens/s, remaining time: 0:28:16 +pred is: + ['1'] + label is: + ['ctenophore Mnemiopsis leidyi'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:48,607 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:48,607 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 311, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:48,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:48,608 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:48,608 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:49,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:49,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:50,145 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5368211269378662 s; generated tokens: 20 tokens; generate speed: 13.013876273194025 tokens/s +2024-07-30 14:05:50,150 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:50,150 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[834/2067], cost time 1.5481s, every example cost time is 1.5481, generate speed: 12.9191 tokens/s, avg speed: 10.4684 tokens/s, remaining time: 0:28:15 +pred is: + ['1'] + label is: + ['Because of their soft, gelatinous bodies'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:50,232 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:50,232 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:50,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:50,233 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:50,233 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:51,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,337 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1037399768829346 s; generated tokens: 6 tokens; generate speed: 5.436062954740993 tokens/s +2024-07-30 14:05:51,342 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:51,342 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[835/2067], cost time 1.1151s, every example cost time is 1.1151, generate speed: 5.3807 tokens/s, avg speed: 10.4635 tokens/s, remaining time: 0:28:13 +pred is: + ['515 million years old'] + label is: + ['515 million years'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:05:51,424 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:51,424 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 382, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:51,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:51,425 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:51,425 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:52,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:52,963 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5381522178649902 s; generated tokens: 20 tokens; generate speed: 13.002614284664693 tokens/s +2024-07-30 14:05:52,968 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:52,968 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[836/2067], cost time 1.5495s, every example cost time is 1.5495, generate speed: 12.9073 tokens/s, avg speed: 10.4668 tokens/s, remaining time: 0:28:12 +pred is: + ['all other animal phyla'] + label is: + ['all other animals'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:05:53,051 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:53,051 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 397, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:53,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:53,052 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:53,052 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:53,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,315 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.262427568435669 s; generated tokens: 11 tokens; generate speed: 8.713371186618332 tokens/s +2024-07-30 14:05:54,319 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:54,320 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[837/2067], cost time 1.2736s, every example cost time is 1.2736, generate speed: 8.6368 tokens/s, avg speed: 10.4647 tokens/s, remaining time: 0:28:11 +pred is: + ['1'] + label is: + ['beroids'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:05:54,402 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:54,402 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:54,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:54,403 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:54,403 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:55,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,538 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1344928741455078 s; generated tokens: 7 tokens; generate speed: 6.170157750239156 tokens/s +2024-07-30 14:05:55,542 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:55,543 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[838/2067], cost time 1.1458s, every example cost time is 1.1458, generate speed: 6.1095 tokens/s, avg speed: 10.4604 tokens/s, remaining time: 0:28:09 +pred is: + ['Fresno'] + label is: + ['Fresno'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:55,625 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:55,625 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:55,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:55,626 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:55,626 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:56,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,853 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2267823219299316 s; generated tokens: 10 tokens; generate speed: 8.151405364456462 tokens/s +2024-07-30 14:05:56,858 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:56,858 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[839/2067], cost time 1.2380s, every example cost time is 1.2380, generate speed: 8.0777 tokens/s, avg speed: 10.4579 tokens/s, remaining time: 0:28:07 +pred is: + ['1872'] + label is: + ['1872'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:56,945 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:56,945 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:56,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:56,946 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:56,946 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:57,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:57,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:57,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:57,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3178248405456543 s; generated tokens: 12 tokens; generate speed: 9.105914254151802 tokens/s +2024-07-30 14:05:58,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:58,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[840/2067], cost time 1.3296s, every example cost time is 1.3296, generate speed: 9.0254 tokens/s, avg speed: 10.4562 tokens/s, remaining time: 0:28:06 +pred is: + ['2.7'] + label is: + ['2.7%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 61.75638914522643, Em score: 48.214285714285715, current_count: 840 +2024-07-30 14:05:58,594 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:58,595 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:58,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:58,595 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:58,596 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:05:59,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,699 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1035468578338623 s; generated tokens: 5 tokens; generate speed: 4.530845214687516 tokens/s +2024-07-30 14:05:59,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:05:59,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[841/2067], cost time 1.1190s, every example cost time is 1.1190, generate speed: 4.4684 tokens/s, avg speed: 10.4504 tokens/s, remaining time: 0:28:04 +pred is: + ['BankAmericard'] + label is: + ['BankAmericard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:05:59,792 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:05:59,792 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:05:59,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:05:59,793 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:05:59,793 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:00,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,866 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0725195407867432 s; generated tokens: 5 tokens; generate speed: 4.661919722536958 tokens/s +2024-07-30 14:06:00,870 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:00,871 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[842/2067], cost time 1.0837s, every example cost time is 1.0837, generate speed: 4.6139 tokens/s, avg speed: 10.4449 tokens/s, remaining time: 0:28:02 +pred is: + ['Bill Aken'] + label is: + ['Bill Aken'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:00,953 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:00,953 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:00,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:00,954 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:00,954 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:01,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:01,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:01,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:01,966 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0119187831878662 s; generated tokens: 3 tokens; generate speed: 2.9646648029884823 tokens/s +2024-07-30 14:06:01,971 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:01,971 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[843/2067], cost time 1.0230s, every example cost time is 1.0230, generate speed: 2.9325 tokens/s, avg speed: 10.4383 tokens/s, remaining time: 0:28:00 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:06:02,053 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:02,053 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:02,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:02,053 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:02,054 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:02,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,594 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5398187637329102 s; generated tokens: 20 tokens; generate speed: 12.988541555056091 tokens/s +2024-07-30 14:06:03,599 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:03,599 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[844/2067], cost time 1.5512s, every example cost time is 1.5512, generate speed: 12.8936 tokens/s, avg speed: 10.4416 tokens/s, remaining time: 0:27:59 +pred is: + ['Between the 1880s and World War II'] + label is: + ['Between the 1880s and World War II'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:03,682 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:03,682 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:03,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:03,683 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:03,683 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:04,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:04,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:05,253 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5700371265411377 s; generated tokens: 20 tokens; generate speed: 12.738552268544693 tokens/s +2024-07-30 14:06:05,258 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:05,258 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[845/2067], cost time 1.5813s, every example cost time is 1.5813, generate speed: 12.6478 tokens/s, avg speed: 10.4446 tokens/s, remaining time: 0:27:58 +pred is: + ['1964'] + label is: + ['1964'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:05,340 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:05,341 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:05,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:05,341 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:05,342 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:06,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,872 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5302987098693848 s; generated tokens: 20 tokens; generate speed: 13.06934382876599 tokens/s +2024-07-30 14:06:06,877 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:06,877 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[846/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9745 tokens/s, avg speed: 10.4479 tokens/s, remaining time: 0:27:57 +pred is: + ["On Fresno's far southeast side, bounded by Chestnut Avenue to the West."] + label is: + ["Fresno's far southeast side"] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:06:06,961 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:06,961 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:06,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:06,962 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:06,962 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:07,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:07,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:07,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,248 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2861988544464111 s; generated tokens: 12 tokens; generate speed: 9.329817048519207 tokens/s +2024-07-30 14:06:08,253 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:08,253 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[847/2067], cost time 1.2975s, every example cost time is 1.2975, generate speed: 9.2488 tokens/s, avg speed: 10.4466 tokens/s, remaining time: 0:27:56 +pred is: + ['1'] + label is: + ['Tower Theatre'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:06:08,335 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:08,335 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:08,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:08,336 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:08,336 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:09,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,905 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5688941478729248 s; generated tokens: 20 tokens; generate speed: 12.747832622816267 tokens/s +2024-07-30 14:06:09,910 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:09,910 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[848/2067], cost time 1.5803s, every example cost time is 1.5803, generate speed: 12.6562 tokens/s, avg speed: 10.4496 tokens/s, remaining time: 0:27:54 +pred is: + ['late 1970s'] + label is: + ['late 1970s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:09,992 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:09,992 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:09,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:09,993 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:09,993 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:10,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:10,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:11,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:11,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:11,033 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0399963855743408 s; generated tokens: 4 tokens; generate speed: 3.846167213159101 tokens/s +2024-07-30 14:06:11,038 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:11,038 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[849/2067], cost time 1.0512s, every example cost time is 1.0512, generate speed: 3.8053 tokens/s, avg speed: 10.4436 tokens/s, remaining time: 0:27:53 +pred is: + ['Live theater'] + label is: + ['live theater'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:11,120 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:11,120 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:11,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:11,121 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:11,121 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:12,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,652 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308687686920166 s; generated tokens: 20 tokens; generate speed: 13.064477118497962 tokens/s +2024-07-30 14:06:12,657 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:12,657 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[850/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9688 tokens/s, avg speed: 10.4470 tokens/s, remaining time: 0:27:52 +pred is: + ['California Bungalow and American Craftsman style homes'] + label is: + ['early twentieth century homes'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +F1 score: 61.81807868469436, Em score: 48.35294117647059, current_count: 850 +2024-07-30 14:06:12,968 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:12,968 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 363, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:12,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:12,969 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:12,969 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:13,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:13,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:13,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,504 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354979038238525 s; generated tokens: 20 tokens; generate speed: 13.025091047141109 tokens/s +2024-07-30 14:06:14,509 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:14,510 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[851/2067], cost time 1.5470s, every example cost time is 1.5470, generate speed: 12.9279 tokens/s, avg speed: 10.4502 tokens/s, remaining time: 0:27:50 +pred is: + ['Huntington Boulevard'] + label is: + ['Huntington Boulevard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:14,591 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:14,592 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:14,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:14,592 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:14,593 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:15,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,664 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071720838546753 s; generated tokens: 5 tokens; generate speed: 4.665394028150064 tokens/s +2024-07-30 14:06:15,669 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:15,670 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[852/2067], cost time 1.0829s, every example cost time is 1.0829, generate speed: 4.6172 tokens/s, avg speed: 10.4448 tokens/s, remaining time: 0:27:49 +pred is: + ['Southwest Fresno'] + label is: + ['"Southwest Fresno"'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:06:15,781 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:15,782 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:15,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:15,782 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:15,783 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:16,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:16,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:17,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:17,340 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5571284294128418 s; generated tokens: 20 tokens; generate speed: 12.844155704961056 tokens/s +2024-07-30 14:06:17,345 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:17,345 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[853/2067], cost time 1.5691s, every example cost time is 1.5691, generate speed: 12.7464 tokens/s, avg speed: 10.4479 tokens/s, remaining time: 0:27:48 +pred is: + ['M. Theo Kearney'] + label is: + ['M. Theo Kearney'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:17,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:17,428 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 324, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:17,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:17,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:17,429 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:18,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:18,965 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.53633451461792 s; generated tokens: 20 tokens; generate speed: 13.01799823521762 tokens/s +2024-07-30 14:06:18,970 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:18,970 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[854/2067], cost time 1.5476s, every example cost time is 1.5476, generate speed: 12.9233 tokens/s, avg speed: 10.4512 tokens/s, remaining time: 0:27:46 +pred is: + ['1960s'] + label is: + ['between the 1960s and 1990s'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:06:19,053 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:19,053 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 451, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:19,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:19,054 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:19,054 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:20,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:20,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:20,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:20,070 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0152111053466797 s; generated tokens: 3 tokens; generate speed: 2.955050416805226 tokens/s +2024-07-30 14:06:20,074 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:20,075 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[855/2067], cost time 1.0264s, every example cost time is 1.0264, generate speed: 2.9228 tokens/s, avg speed: 10.4446 tokens/s, remaining time: 0:27:45 +pred is: + ['Ralph Woodward'] + label is: + ['Ralph Woodward'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:20,156 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:20,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:20,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:20,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:20,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:21,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,719 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.561002492904663 s; generated tokens: 20 tokens; generate speed: 12.812279346706644 tokens/s +2024-07-30 14:06:21,723 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:21,724 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[856/2067], cost time 1.5723s, every example cost time is 1.5723, generate speed: 12.7204 tokens/s, avg speed: 10.4476 tokens/s, remaining time: 0:27:43 +pred is: + ['1946'] + label is: + ['1946'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:21,806 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:21,806 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 415, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:21,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:21,807 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:21,807 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:22,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,882 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0748772621154785 s; generated tokens: 5 tokens; generate speed: 4.651693896807754 tokens/s +2024-07-30 14:06:22,887 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:22,887 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[857/2067], cost time 1.0861s, every example cost time is 1.0861, generate speed: 4.6037 tokens/s, avg speed: 10.4423 tokens/s, remaining time: 0:27:42 +pred is: + ['Hot and dry'] + label is: + ['hot and dry'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:22,969 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:22,969 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:22,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:22,970 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:22,970 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:23,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:23,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:23,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,383 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4122862815856934 s; generated tokens: 16 tokens; generate speed: 11.329147785840874 tokens/s +2024-07-30 14:06:24,388 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:24,388 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[858/2067], cost time 1.4236s, every example cost time is 1.4236, generate speed: 11.2395 tokens/s, avg speed: 10.4432 tokens/s, remaining time: 0:27:40 +pred is: + ['115 °F (46.1 °C)'] + label is: + ['115 °F'] +The F1/Em of this example is: {'F1': 53.333333333333336, 'Em': 0.0} +2024-07-30 14:06:24,470 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:24,471 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 337, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:24,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:24,471 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:24,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:25,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:25,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:26,005 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5333640575408936 s; generated tokens: 20 tokens; generate speed: 13.04321690706293 tokens/s +2024-07-30 14:06:26,010 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:26,010 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[859/2067], cost time 1.5447s, every example cost time is 1.5447, generate speed: 12.9471 tokens/s, avg speed: 10.4465 tokens/s, remaining time: 0:27:39 +pred is: + ['494,665'] + label is: + ['494,665'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:26,093 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:26,093 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:26,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:26,094 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:26,094 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:27,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,167 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0733323097229004 s; generated tokens: 5 tokens; generate speed: 4.658389535754158 tokens/s +2024-07-30 14:06:27,172 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:27,172 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[860/2067], cost time 1.0844s, every example cost time is 1.0844, generate speed: 4.6108 tokens/s, avg speed: 10.4411 tokens/s, remaining time: 0:27:37 +pred is: + ['68,511'] + label is: + ['68,511'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.08569792479482, Em score: 48.604651162790695, current_count: 860 +2024-07-30 14:06:27,512 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:27,512 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:27,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:27,513 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:27,513 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:28,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:28,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:29,069 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5559065341949463 s; generated tokens: 20 tokens; generate speed: 12.854242565636088 tokens/s +2024-07-30 14:06:29,074 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:29,074 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[861/2067], cost time 1.5678s, every example cost time is 1.5678, generate speed: 12.7566 tokens/s, avg speed: 10.4442 tokens/s, remaining time: 0:27:36 +pred is: + ['427,652'] + label is: + ['427,652'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:29,156 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:29,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:29,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:29,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:29,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:30,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,690 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5325498580932617 s; generated tokens: 20 tokens; generate speed: 13.050146391245772 tokens/s +2024-07-30 14:06:30,695 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:30,695 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[862/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9546 tokens/s, avg speed: 10.4475 tokens/s, remaining time: 0:27:35 +pred is: + ['1'] + label is: + ['To avoid interference with existing VHF television stations'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:06:30,778 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:30,779 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:30,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:30,779 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:30,779 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:31,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:31,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:32,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:32,336 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5561745166778564 s; generated tokens: 20 tokens; generate speed: 12.852028988815654 tokens/s +2024-07-30 14:06:32,341 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:32,341 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[863/2067], cost time 1.5675s, every example cost time is 1.5675, generate speed: 12.7588 tokens/s, avg speed: 10.4505 tokens/s, remaining time: 0:27:34 +pred is: + ['State Route 99'] + label is: + ['State Route 99'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:32,424 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:32,424 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:32,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:32,424 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:32,425 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:33,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,560 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1347215175628662 s; generated tokens: 7 tokens; generate speed: 6.16891447959361 tokens/s +2024-07-30 14:06:33,565 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:33,565 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[864/2067], cost time 1.1462s, every example cost time is 1.1462, generate speed: 6.1073 tokens/s, avg speed: 10.4463 tokens/s, remaining time: 0:27:32 +pred is: + ['Fresno'] + label is: + ['Fresno'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:33,647 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:33,647 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:33,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:33,648 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:33,648 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:34,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1642282009124756 s; generated tokens: 8 tokens; generate speed: 6.871505082706225 tokens/s +2024-07-30 14:06:34,817 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:34,817 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[865/2067], cost time 1.1760s, every example cost time is 1.1760, generate speed: 6.8030 tokens/s, avg speed: 10.4427 tokens/s, remaining time: 0:27:31 +pred is: + ['Amtrak San Joaquins'] + label is: + ['Amtrak San Joaquins'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:34,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:34,900 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:34,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:34,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:34,901 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:35,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:35,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:35,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:35,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:35,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,440 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.53818678855896 s; generated tokens: 20 tokens; generate speed: 13.00232205136599 tokens/s +2024-07-30 14:06:36,444 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:36,445 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[866/2067], cost time 1.5493s, every example cost time is 1.5493, generate speed: 12.9088 tokens/s, avg speed: 10.4459 tokens/s, remaining time: 0:27:30 +pred is: + ['The concept Distributed Adaptive Message Block Switching'] + label is: + ['Paul Baran developed the concept Distributed Adaptive Message Block Switching'] +The F1/Em of this example is: {'F1': 81.25000000000001, 'Em': 0.0} +2024-07-30 14:06:36,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:36,528 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:36,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:36,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:36,529 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:37,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,637 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1076641082763672 s; generated tokens: 6 tokens; generate speed: 5.416804566626775 tokens/s +2024-07-30 14:06:37,641 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:37,642 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[867/2067], cost time 1.1188s, every example cost time is 1.1188, generate speed: 5.3628 tokens/s, avg speed: 10.4412 tokens/s, remaining time: 0:27:28 +pred is: + ['Circuit Switching'] + label is: + ['circuit switching'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:37,725 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:37,725 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:37,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:37,726 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:37,726 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:38,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,889 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.163487434387207 s; generated tokens: 8 tokens; generate speed: 6.875880016885176 tokens/s +2024-07-30 14:06:38,894 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:38,894 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[868/2067], cost time 1.1746s, every example cost time is 1.1746, generate speed: 6.8109 tokens/s, avg speed: 10.4376 tokens/s, remaining time: 0:27:26 +pred is: + ['With or without intermediate forwarding nodes'] + label is: + ['with or without intermediate forwarding nodes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:38,978 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:38,978 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:38,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:38,979 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:38,979 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:39,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:39,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:39,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,146 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.167210578918457 s; generated tokens: 8 tokens; generate speed: 6.853947474853114 tokens/s +2024-07-30 14:06:40,151 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:40,151 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[869/2067], cost time 1.1784s, every example cost time is 1.1784, generate speed: 6.7891 tokens/s, avg speed: 10.4340 tokens/s, remaining time: 0:27:25 +pred is: + ['Distributed adaptive message block switching'] + label is: + ['the concept of distributed adaptive message block switching'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:06:40,234 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:40,234 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:40,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:40,235 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:40,235 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:41,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,308 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0722839832305908 s; generated tokens: 5 tokens; generate speed: 4.662943845282419 tokens/s +2024-07-30 14:06:41,312 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:41,313 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[870/2067], cost time 1.0834s, every example cost time is 1.0834, generate speed: 4.6151 tokens/s, avg speed: 10.4287 tokens/s, remaining time: 0:27:23 +pred is: + ['Packet Switching'] + label is: + ['independently developed the same message routing methodology as developed by Baran'] +The F1/Em of this example is: {'F1': 8.333333333333332, 'Em': 0.0} +F1 score: 62.25090063064009, Em score: 48.735632183908045, current_count: 870 +2024-07-30 14:06:41,629 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:41,629 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:41,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:41,630 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:41,630 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:42,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,705 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0744118690490723 s; generated tokens: 5 tokens; generate speed: 4.653708828091541 tokens/s +2024-07-30 14:06:42,710 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:42,710 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[871/2067], cost time 1.0856s, every example cost time is 1.0856, generate speed: 4.6056 tokens/s, avg speed: 10.4234 tokens/s, remaining time: 0:27:21 +pred is: + ['complete addressing information'] + label is: + ['each packet includes complete addressing information'] +The F1/Em of this example is: {'F1': 62.5, 'Em': 0.0} +2024-07-30 14:06:42,793 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:42,794 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:42,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:42,794 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:42,795 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:43,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:43,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:43,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:43,805 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.009883165359497 s; generated tokens: 3 tokens; generate speed: 2.970640667063762 tokens/s +2024-07-30 14:06:43,809 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:43,810 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[872/2067], cost time 1.0210s, every example cost time is 1.0210, generate speed: 2.9382 tokens/s, avg speed: 10.4170 tokens/s, remaining time: 0:27:19 +pred is: + ['No'] + label is: + ['The packet header can be small, as it only needs to contain this code and any information, such as length, timestamp, or sequence number'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:06:43,898 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:43,898 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 764, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:43,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:43,899 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:43,899 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:44,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:44,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:44,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:44,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:44,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5489966869354248 s; generated tokens: 20 tokens; generate speed: 12.91158345830198 tokens/s +2024-07-30 14:06:45,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:45,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[873/2067], cost time 1.5605s, every example cost time is 1.5605, generate speed: 12.8160 tokens/s, avg speed: 10.4202 tokens/s, remaining time: 0:27:18 +pred is: + ['Connection-oriented operations'] + label is: + ['connection-oriented operations. But X.25 does it at the network layer of the OSI Model. Frame Relay does it at level two, the data link layer'] +The F1/Em of this example is: {'F1': 10.90909090909091, 'Em': 0.0} +2024-07-30 14:06:45,538 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:45,538 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:45,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:45,539 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:45,539 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:46,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:46,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:46,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:46,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:46,580 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0409343242645264 s; generated tokens: 4 tokens; generate speed: 3.8427016063921284 tokens/s +2024-07-30 14:06:46,584 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:46,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[874/2067], cost time 1.0520s, every example cost time is 1.0520, generate speed: 3.8022 tokens/s, avg speed: 10.4144 tokens/s, remaining time: 0:27:16 +pred is: + ['1969'] + label is: + ['1969'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:06:46,666 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:46,666 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 140, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:46,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:46,667 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:46,667 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:47,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:47,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:48,197 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5295984745025635 s; generated tokens: 20 tokens; generate speed: 13.075326847788695 tokens/s +2024-07-30 14:06:48,202 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:48,202 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[875/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9809 tokens/s, avg speed: 10.4177 tokens/s, remaining time: 0:27:15 +pred is: + ['A proprietary suite of networking protocols developed by Apple Inc. in 1985 for Apple Macintosh'] + label is: + ['a proprietary suite of networking protocols developed by Apple Inc. in 1985'] +The F1/Em of this example is: {'F1': 88.8888888888889, 'Em': 0.0} +2024-07-30 14:06:48,285 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:48,286 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:48,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:48,286 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:48,287 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:49,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,391 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1041715145111084 s; generated tokens: 6 tokens; generate speed: 5.433938406440966 tokens/s +2024-07-30 14:06:49,396 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:49,396 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[876/2067], cost time 1.1154s, every example cost time is 1.1154, generate speed: 5.3794 tokens/s, avg speed: 10.4130 tokens/s, remaining time: 0:27:13 +pred is: + ['CYCLADES'] + label is: + ['CYCLADES packet switching network'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:06:49,478 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:49,478 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:49,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:49,479 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:49,479 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:50,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1335220336914062 s; generated tokens: 7 tokens; generate speed: 6.175442375128725 tokens/s +2024-07-30 14:06:50,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:50,618 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[877/2067], cost time 1.1447s, every example cost time is 1.1447, generate speed: 6.1154 tokens/s, avg speed: 10.4089 tokens/s, remaining time: 0:27:12 +pred is: + ['A suite of network protocols'] + label is: + ['a suite of network protocols created by Digital Equipment Corporation'] +The F1/Em of this example is: {'F1': 64.28571428571429, 'Em': 0.0} +2024-07-30 14:06:50,701 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:50,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:50,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:50,702 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:50,702 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:51,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,836 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1339232921600342 s; generated tokens: 7 tokens; generate speed: 6.173257087492712 tokens/s +2024-07-30 14:06:51,841 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:51,841 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[878/2067], cost time 1.1451s, every example cost time is 1.1451, generate speed: 6.1132 tokens/s, avg speed: 10.4048 tokens/s, remaining time: 0:27:10 +pred is: + ['a high-level marketing manager'] + label is: + ["a data network based on this voice-phone network was designed to connect GE's four computer sales and service centers"] +The F1/Em of this example is: {'F1': 8.695652173913043, 'Em': 0.0} +2024-07-30 14:06:51,925 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:51,925 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 312, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:51,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:51,926 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:51,926 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:52,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:52,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:52,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:52,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:52,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,473 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.547135353088379 s; generated tokens: 20 tokens; generate speed: 12.927117178258621 tokens/s +2024-07-30 14:06:53,478 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:53,478 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[879/2067], cost time 1.5583s, every example cost time is 1.5583, generate speed: 12.8347 tokens/s, avg speed: 10.4079 tokens/s, remaining time: 0:27:09 +pred is: + ["to explore computer networking between three of Michigan's public universities as a means to help the state's"] + label is: + ["as a means to help the state's educational and economic development"] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:06:53,561 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:53,562 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:53,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:53,562 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:53,562 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:54,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:54,671 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.108124017715454 s; generated tokens: 6 tokens; generate speed: 5.414556407115697 tokens/s +2024-07-30 14:06:54,675 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:54,676 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[880/2067], cost time 1.1192s, every example cost time is 1.1192, generate speed: 5.3608 tokens/s, avg speed: 10.4033 tokens/s, remaining time: 0:27:07 +pred is: + ['A public data network'] + label is: + ['the first FCC-licensed public data network in the United States'] +The F1/Em of this example is: {'F1': 46.15384615384615, 'Em': 0.0} +F1 score: 62.062178114850376, Em score: 48.29545454545455, current_count: 880 +2024-07-30 14:06:55,001 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:55,001 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:55,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:55,002 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:55,002 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:55,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:55,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,544 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541027307510376 s; generated tokens: 20 tokens; generate speed: 12.9783553494008 tokens/s +2024-07-30 14:06:56,548 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:56,549 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[881/2067], cost time 1.5524s, every example cost time is 1.5524, generate speed: 12.8835 tokens/s, avg speed: 10.4064 tokens/s, remaining time: 0:27:06 +pred is: + ['An international data communications network headquartered in San Jose, CA that utilized virtual call packet switched technology and'] + label is: + ['an international data communications network headquartered in San Jose, CA'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 14:06:56,632 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:56,633 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:56,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:56,633 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:56,633 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:57,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:57,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:57,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:57,644 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0105352401733398 s; generated tokens: 3 tokens; generate speed: 2.9687237819488628 tokens/s +2024-07-30 14:06:57,649 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:57,649 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[882/2067], cost time 1.0216s, every example cost time is 1.0216, generate speed: 2.9366 tokens/s, avg speed: 10.4001 tokens/s, remaining time: 0:27:04 +pred is: + ['Two'] + label is: + ['There were two kinds of X.25 networks. Some such as DATAPAC and TRANSPAC'] +The F1/Em of this example is: {'F1': 7.4074074074074066, 'Em': 0.0} +2024-07-30 14:06:57,731 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:57,732 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:57,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:57,732 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:57,732 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:58,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,898 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1654794216156006 s; generated tokens: 8 tokens; generate speed: 6.864128058915283 tokens/s +2024-07-30 14:06:58,903 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:06:58,903 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[883/2067], cost time 1.1766s, every example cost time is 1.1766, generate speed: 6.7995 tokens/s, avg speed: 10.3966 tokens/s, remaining time: 0:27:03 +pred is: + ['A public X.25 network'] + label is: + ['AUSTPAC was an Australian public X.25 network operated by Telstra'] +The F1/Em of this example is: {'F1': 46.15384615384615, 'Em': 0.0} +2024-07-30 14:06:58,986 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:06:58,986 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:06:58,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:58,987 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:06:58,987 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:06:59,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:59,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:06:59,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,523 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535534143447876 s; generated tokens: 20 tokens; generate speed: 13.024783646355242 tokens/s +2024-07-30 14:07:00,527 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:00,528 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[884/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9305 tokens/s, avg speed: 10.3999 tokens/s, remaining time: 0:27:01 +pred is: + ['The public switched data network operated by the Dutch PTT Telecom (now known as KPN)'] + label is: + ['was the public switched data network operated by the Dutch PTT Telecom'] +The F1/Em of this example is: {'F1': 77.77777777777777, 'Em': 0.0} +2024-07-30 14:07:00,612 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:00,612 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:00,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:00,613 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:00,613 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:01,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:01,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:02,152 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5388462543487549 s; generated tokens: 20 tokens; generate speed: 12.996749963474466 tokens/s +2024-07-30 14:07:02,157 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:02,157 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[885/2067], cost time 1.5501s, every example cost time is 1.5501, generate speed: 12.9022 tokens/s, avg speed: 10.4031 tokens/s, remaining time: 0:27:00 +pred is: + ['A computer network'] + label is: + ['The Computer Science Network'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:07:02,240 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:02,241 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:02,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:02,241 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:02,241 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:03,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,776 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534052848815918 s; generated tokens: 20 tokens; generate speed: 13.03736048952766 tokens/s +2024-07-30 14:07:03,780 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:03,781 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[886/2067], cost time 1.5451s, every example cost time is 1.5451, generate speed: 12.9439 tokens/s, avg speed: 10.4063 tokens/s, remaining time: 0:26:59 +pred is: + ['a not-for-profit United States computer networking consortium led by members from the research and education communities,'] + label is: + ['a not-for-profit United States computer networking consortium led by members from the research and education communities, industry, and government'] +The F1/Em of this example is: {'F1': 90.14084507042254, 'Em': 0.0} +2024-07-30 14:07:03,866 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:03,866 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:03,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:03,867 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:03,867 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:04,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:04,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:05,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:05,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:05,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:05,401 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5341081619262695 s; generated tokens: 20 tokens; generate speed: 13.03689042035174 tokens/s +2024-07-30 14:07:05,406 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:05,406 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[887/2067], cost time 1.5453s, every example cost time is 1.5453, generate speed: 12.9427 tokens/s, avg speed: 10.4095 tokens/s, remaining time: 0:26:58 +pred is: + ['A program of coordinated, evolving projects sponsored by the National Science Foundation (NSF) beginning in'] + label is: + ['The National Science Foundation Network'] +The F1/Em of this example is: {'F1': 39.02439024390244, 'Em': 0.0} +2024-07-30 14:07:05,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:05,490 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:05,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:05,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:05,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:06,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:06,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:07,032 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5401301383972168 s; generated tokens: 20 tokens; generate speed: 12.985915606335453 tokens/s +2024-07-30 14:07:07,036 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:07,037 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[888/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8913 tokens/s, avg speed: 10.4127 tokens/s, remaining time: 0:26:57 +pred is: + ['Very high-speed Backbone Network Service'] + label is: + ['The Very high-speed Backbone Network Service'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +2024-07-30 14:07:07,121 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:07,121 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:07,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:07,122 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:07,122 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:08,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:08,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:08,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:08,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:08,163 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0409116744995117 s; generated tokens: 4 tokens; generate speed: 3.8427852218328407 tokens/s +2024-07-30 14:07:08,168 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:08,168 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[889/2067], cost time 1.0524s, every example cost time is 1.0524, generate speed: 3.8010 tokens/s, avg speed: 10.4070 tokens/s, remaining time: 0:26:55 +pred is: + ['Central Asia'] + label is: + ['the arid plains of Central Asia'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 14:07:08,252 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:08,252 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 284, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:08,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:08,253 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:08,253 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:09,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:09,807 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5535979270935059 s; generated tokens: 20 tokens; generate speed: 12.873343643948019 tokens/s +2024-07-30 14:07:09,812 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:09,812 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[890/2067], cost time 1.5649s, every example cost time is 1.5649, generate speed: 12.7801 tokens/s, avg speed: 10.4100 tokens/s, remaining time: 0:26:54 +pred is: + ['(Correct)'] + label is: + ['commonly present'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 61.94326597978359, Em score: 47.752808988764045, current_count: 890 +2024-07-30 14:07:10,155 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:10,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:10,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:10,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:10,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:11,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,263 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1060636043548584 s; generated tokens: 6 tokens; generate speed: 5.42464282919757 tokens/s +2024-07-30 14:07:11,268 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:11,268 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[891/2067], cost time 1.1177s, every example cost time is 1.1177, generate speed: 5.3683 tokens/s, avg speed: 10.4054 tokens/s, remaining time: 0:26:52 +pred is: + ['Genoese traders'] + label is: + ['Genoese traders'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:11,351 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:11,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:11,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:11,352 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:11,352 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:12,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:12,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:12,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:12,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:12,395 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0420286655426025 s; generated tokens: 4 tokens; generate speed: 3.83866599093714 tokens/s +2024-07-30 14:07:12,399 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:12,400 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[892/2067], cost time 1.0531s, every example cost time is 1.0531, generate speed: 3.7982 tokens/s, avg speed: 10.3997 tokens/s, remaining time: 0:26:51 +pred is: + ['Northwest'] + label is: + ['northwest across Europe'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:07:12,493 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:12,493 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:12,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:12,494 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:12,494 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:13,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:13,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:14,009 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5150601863861084 s; generated tokens: 19 tokens; generate speed: 12.540755918958528 tokens/s +2024-07-30 14:07:14,014 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:14,014 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[893/2067], cost time 1.5286s, every example cost time is 1.5286, generate speed: 12.4293 tokens/s, avg speed: 10.4022 tokens/s, remaining time: 0:26:49 +pred is: + ['It led to serious depopulation and permanent change in both economic and social structures.'] + label is: + ['serious depopulation and permanent change in both economic and social structures'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:07:14,099 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:14,099 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:14,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:14,100 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:14,100 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:15,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:15,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:15,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:15,109 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0094516277313232 s; generated tokens: 3 tokens; generate speed: 2.971910607289132 tokens/s +2024-07-30 14:07:15,114 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:15,114 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[894/2067], cost time 1.0205s, every example cost time is 1.0205, generate speed: 2.9399 tokens/s, avg speed: 10.3960 tokens/s, remaining time: 0:26:48 +pred is: + ['Gasquet'] + label is: + ['Gasquet'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:15,195 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:15,196 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:15,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:15,196 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:15,196 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:16,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,671 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.474912166595459 s; generated tokens: 18 tokens; generate speed: 12.204116562106485 tokens/s +2024-07-30 14:07:16,676 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:16,677 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[895/2067], cost time 1.4861s, every example cost time is 1.4861, generate speed: 12.1125 tokens/s, avg speed: 10.3981 tokens/s, remaining time: 0:26:46 +pred is: + ['The heavens'] + label is: + ['the heavens'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:16,759 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:16,759 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:16,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:16,760 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:16,760 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:17,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:17,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:18,081 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3209404945373535 s; generated tokens: 13 tokens; generate speed: 9.841472839814122 tokens/s +2024-07-30 14:07:18,086 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:18,086 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[896/2067], cost time 1.3321s, every example cost time is 1.3321, generate speed: 9.7592 tokens/s, avg speed: 10.3974 tokens/s, remaining time: 0:26:45 +pred is: + ['Yersinia pestis'] + label is: + ['Yersinia pestis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:18,168 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:18,168 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:18,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:18,169 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:18,169 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:19,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,333 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.16336989402771 s; generated tokens: 8 tokens; generate speed: 6.8765747171805796 tokens/s +2024-07-30 14:07:19,337 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:19,338 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[897/2067], cost time 1.1744s, every example cost time is 1.1744, generate speed: 6.8119 tokens/s, avg speed: 10.3940 tokens/s, remaining time: 0:26:43 +pred is: + ['Francis Aidan Gasquet'] + label is: + ['Francis Aidan Gasquet'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:19,420 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:19,420 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 266, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:19,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:19,421 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:19,421 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:20,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:20,958 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372982025146484 s; generated tokens: 20 tokens; generate speed: 13.009837627654044 tokens/s +2024-07-30 14:07:20,963 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:20,963 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[898/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9153 tokens/s, avg speed: 10.3972 tokens/s, remaining time: 0:26:42 +pred is: + ['30-75%'] + label is: + ['30–75%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:21,045 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:21,046 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:21,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:21,046 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:21,046 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:21,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,580 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337340831756592 s; generated tokens: 20 tokens; generate speed: 13.040070126491015 tokens/s +2024-07-30 14:07:22,585 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:22,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[899/2067], cost time 1.5449s, every example cost time is 1.5449, generate speed: 12.9458 tokens/s, avg speed: 10.4004 tokens/s, remaining time: 0:26:41 +pred is: + ['October 2010'] + label is: + ['In October 2010'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:07:22,668 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:22,668 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 292, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:22,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:22,669 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:22,669 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:23,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:23,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:23,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:23,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:23,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:23,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0733466148376465 s; generated tokens: 5 tokens; generate speed: 4.658327450686837 tokens/s +2024-07-30 14:07:23,747 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:23,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[900/2067], cost time 1.0844s, every example cost time is 1.0844, generate speed: 4.6109 tokens/s, avg speed: 10.3953 tokens/s, remaining time: 0:26:39 +pred is: + ['Genetic branches'] + label is: + ['genetic branches'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.137282601172245, Em score: 47.888888888888886, current_count: 900 +2024-07-30 14:07:24,088 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:24,089 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:24,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:24,089 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:24,089 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:25,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,161 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.07163667678833 s; generated tokens: 5 tokens; generate speed: 4.6657604282310325 tokens/s +2024-07-30 14:07:25,166 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:25,166 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[901/2067], cost time 1.0830s, every example cost time is 1.0830, generate speed: 4.6169 tokens/s, avg speed: 10.3902 tokens/s, remaining time: 0:26:37 +pred is: + ['Confirmed and amended'] + label is: + ['confirmed and amended'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:25,248 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:25,249 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:25,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:25,249 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:25,249 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:26,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4727234840393066 s; generated tokens: 18 tokens; generate speed: 12.222253664775257 tokens/s +2024-07-30 14:07:26,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:26,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[902/2067], cost time 1.4839s, every example cost time is 1.4839, generate speed: 12.1303 tokens/s, avg speed: 10.3923 tokens/s, remaining time: 0:26:36 +pred is: + ['J. F. D. Shrewsbury'] + label is: + ['British bacteriologist J. F. D. Shrewsbury'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:07:26,810 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:26,811 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:26,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:26,811 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:26,812 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:27,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:27,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:28,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:28,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:28,348 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5364103317260742 s; generated tokens: 20 tokens; generate speed: 13.017355837181254 tokens/s +2024-07-30 14:07:28,353 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:28,353 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[903/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9220 tokens/s, avg speed: 10.3955 tokens/s, remaining time: 0:26:35 +pred is: + ['1'] + label is: + ['epidemiological account of the plague'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:28,436 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:28,437 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 288, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:28,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:28,437 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:28,438 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:29,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:29,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:30,002 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5637903213500977 s; generated tokens: 20 tokens; generate speed: 12.789438409321404 tokens/s +2024-07-30 14:07:30,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:30,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[904/2067], cost time 1.5752s, every example cost time is 1.5752, generate speed: 12.6968 tokens/s, avg speed: 10.3984 tokens/s, remaining time: 0:26:34 +pred is: + ['Because the symptoms of the Black Death are not unique (and arguably in some accounts may differ from'] + label is: + ['the rat population was insufficient'] +The F1/Em of this example is: {'F1': 8.888888888888888, 'Em': 0.0} +2024-07-30 14:07:30,091 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:30,091 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 373, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:30,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:30,092 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:30,092 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:31,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,480 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3874175548553467 s; generated tokens: 15 tokens; generate speed: 10.811453226540667 tokens/s +2024-07-30 14:07:31,485 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:31,485 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[905/2067], cost time 1.3992s, every example cost time is 1.3992, generate speed: 10.7207 tokens/s, avg speed: 10.3987 tokens/s, remaining time: 0:26:33 +pred is: + ['A form of anthrax'] + label is: + ['a form of anthrax'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:31,567 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:31,567 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 357, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:31,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:31,568 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:31,568 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:32,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:32,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:32,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:32,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:32,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0447051525115967 s; generated tokens: 4 tokens; generate speed: 3.8288315036864895 tokens/s +2024-07-30 14:07:32,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:32,618 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[906/2067], cost time 1.0559s, every example cost time is 1.0559, generate speed: 3.7883 tokens/s, avg speed: 10.3931 tokens/s, remaining time: 0:26:31 +pred is: + ['33%'] + label is: + ['about a third.'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:32,700 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:32,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:32,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:32,701 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:32,701 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:33,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:33,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:34,022 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3209245204925537 s; generated tokens: 13 tokens; generate speed: 9.841591853524294 tokens/s +2024-07-30 14:07:34,028 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:34,028 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[907/2067], cost time 1.3324s, every example cost time is 1.3324, generate speed: 9.7570 tokens/s, avg speed: 10.3924 tokens/s, remaining time: 0:26:29 +pred is: + ['The plague returned to Europe in 1628-31'] + label is: + ['throughout the 14th to 17th centuries'] +The F1/Em of this example is: {'F1': 24.999999999999993, 'Em': 0.0} +2024-07-30 14:07:34,110 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:34,110 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:34,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:34,111 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:34,111 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:35,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,650 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539013385772705 s; generated tokens: 20 tokens; generate speed: 12.995338562281859 tokens/s +2024-07-30 14:07:35,655 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:35,656 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[908/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9008 tokens/s, avg speed: 10.3956 tokens/s, remaining time: 0:26:28 +pred is: + ['1'] + label is: + ['propose a range of preincident population figures from as high as 7 million to as low as 4 million'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:35,738 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:35,739 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 324, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:35,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:35,739 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:35,740 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:36,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,814 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0741181373596191 s; generated tokens: 5 tokens; generate speed: 4.65498144579415 tokens/s +2024-07-30 14:07:36,819 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:36,819 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[909/2067], cost time 1.0852s, every example cost time is 1.0852, generate speed: 4.6073 tokens/s, avg speed: 10.3905 tokens/s, remaining time: 0:26:27 +pred is: + ['40,000'] + label is: + ['40,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:36,907 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:36,907 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:36,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:36,908 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:36,908 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:37,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:37,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:37,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:37,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:37,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:38,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:38,015 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1066901683807373 s; generated tokens: 6 tokens; generate speed: 5.421571611844125 tokens/s +2024-07-30 14:07:38,020 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:38,020 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[910/2067], cost time 1.1182s, every example cost time is 1.1182, generate speed: 5.3660 tokens/s, avg speed: 10.3860 tokens/s, remaining time: 0:26:25 +pred is: + ['1.7 million'] + label is: + ['some 1.7 million victims'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +F1 score: 61.978875344260715, Em score: 47.69230769230769, current_count: 910 +2024-07-30 14:07:38,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:38,365 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:38,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:38,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:38,366 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:39,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,514 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1483583450317383 s; generated tokens: 7 tokens; generate speed: 6.095658232715271 tokens/s +2024-07-30 14:07:39,519 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:39,519 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[911/2067], cost time 1.1598s, every example cost time is 1.1598, generate speed: 6.0353 tokens/s, avg speed: 10.3820 tokens/s, remaining time: 0:26:23 +pred is: + ['1500-1850'] + label is: + ['between 1500 and 1850'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:39,602 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:39,602 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:39,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:39,603 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:39,603 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:40,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,742 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1386828422546387 s; generated tokens: 7 tokens; generate speed: 6.147453654557324 tokens/s +2024-07-30 14:07:40,747 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:40,747 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[912/2067], cost time 1.1499s, every example cost time is 1.1499, generate speed: 6.0875 tokens/s, avg speed: 10.3780 tokens/s, remaining time: 0:26:22 +pred is: + ['magma'] + label is: + ['melt (magma and/or lava)'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:07:40,830 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:40,831 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:40,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:40,831 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:40,832 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:41,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:41,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1056358814239502 s; generated tokens: 6 tokens; generate speed: 5.426741390006799 tokens/s +2024-07-30 14:07:41,942 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:41,942 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[913/2067], cost time 1.1172s, every example cost time is 1.1172, generate speed: 5.3708 tokens/s, avg speed: 10.3735 tokens/s, remaining time: 0:26:20 +pred is: + ['seafloor spreading'] + label is: + ['seafloor spreading'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:42,025 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:42,025 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:42,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:42,026 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:42,026 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:42,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,567 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5409836769104004 s; generated tokens: 20 tokens; generate speed: 12.978722811716642 tokens/s +2024-07-30 14:07:43,572 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:43,572 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[914/2067], cost time 1.5526s, every example cost time is 1.5526, generate speed: 12.8815 tokens/s, avg speed: 10.3767 tokens/s, remaining time: 0:26:19 +pred is: + ['1'] + label is: + ['divergent boundaries'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:43,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:43,654 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:43,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:43,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:43,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:44,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:44,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:45,194 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390045642852783 s; generated tokens: 20 tokens; generate speed: 12.995413050830102 tokens/s +2024-07-30 14:07:45,199 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:45,200 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[915/2067], cost time 1.5505s, every example cost time is 1.5505, generate speed: 12.8989 tokens/s, avg speed: 10.3798 tokens/s, remaining time: 0:26:18 +pred is: + ['P-waves'] + label is: + ['seismic waves'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:45,282 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:45,282 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:45,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:45,283 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:45,283 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:46,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,788 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.50482177734375 s; generated tokens: 19 tokens; generate speed: 12.626079902656661 tokens/s +2024-07-30 14:07:46,793 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:46,793 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[916/2067], cost time 1.5163s, every example cost time is 1.5163, generate speed: 12.5303 tokens/s, avg speed: 10.3824 tokens/s, remaining time: 0:26:16 +pred is: + ['The second timeline is needed to show the most recent eon with an expanded scale.'] + label is: + ['second scale shows the most recent eon with an expanded scale'] +The F1/Em of this example is: {'F1': 62.745098039215684, 'Em': 0.0} +2024-07-30 14:07:46,877 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:46,877 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:46,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:46,878 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:46,878 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:47,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:47,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:47,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:47,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:47,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:47,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,411 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5327835083007812 s; generated tokens: 20 tokens; generate speed: 13.048157089171498 tokens/s +2024-07-30 14:07:48,416 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:48,416 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[917/2067], cost time 1.5442s, every example cost time is 1.5442, generate speed: 12.9518 tokens/s, avg speed: 10.3855 tokens/s, remaining time: 0:26:15 +pred is: + ['The principle of cross-cutting relationships'] + label is: + ['The principle of cross-cutting relationships'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:48,500 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:48,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:48,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:48,501 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:48,501 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:49,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,615 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.113851547241211 s; generated tokens: 6 tokens; generate speed: 5.386714248286325 tokens/s +2024-07-30 14:07:49,620 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:49,620 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[918/2067], cost time 1.1253s, every example cost time is 1.1253, generate speed: 5.3321 tokens/s, avg speed: 10.3810 tokens/s, remaining time: 0:26:14 +pred is: + ['Xenoliths'] + label is: + ['xenoliths'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:49,702 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:49,702 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:49,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:49,703 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:49,703 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:50,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,868 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1648917198181152 s; generated tokens: 8 tokens; generate speed: 6.867591093573152 tokens/s +2024-07-30 14:07:50,873 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:50,873 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[919/2067], cost time 1.1762s, every example cost time is 1.1762, generate speed: 6.8016 tokens/s, avg speed: 10.3777 tokens/s, remaining time: 0:26:12 +pred is: + ['The principle of faunal succession'] + label is: + ['The principle of faunal succession'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:50,956 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:50,957 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:50,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:50,957 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:50,958 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:51,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:51,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:51,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:51,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,490 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5324945449829102 s; generated tokens: 20 tokens; generate speed: 13.050617416862018 tokens/s +2024-07-30 14:07:52,495 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:52,495 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[920/2067], cost time 1.5437s, every example cost time is 1.5437, generate speed: 12.9555 tokens/s, avg speed: 10.3808 tokens/s, remaining time: 0:26:11 +pred is: + ['1900'] + label is: + ['At the beginning of the 20th century'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 61.82991484925703, Em score: 47.608695652173914, current_count: 920 +2024-07-30 14:07:52,847 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:52,848 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:52,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:52,848 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:52,848 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:53,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:53,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:54,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:54,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:54,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:54,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539076805114746 s; generated tokens: 20 tokens; generate speed: 12.994803075151859 tokens/s +2024-07-30 14:07:54,392 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:54,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[921/2067], cost time 1.5507s, every example cost time is 1.5507, generate speed: 12.8975 tokens/s, avg speed: 10.3839 tokens/s, remaining time: 0:26:10 +pred is: + ['1'] + label is: + ['Thermochemical techniques'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:54,475 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:54,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 328, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:54,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:54,476 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:54,476 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:55,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,739 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2625246047973633 s; generated tokens: 11 tokens; generate speed: 8.712701485738975 tokens/s +2024-07-30 14:07:55,744 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:55,744 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[922/2067], cost time 1.2739s, every example cost time is 1.2739, generate speed: 8.6351 tokens/s, avg speed: 10.3822 tokens/s, remaining time: 0:26:08 +pred is: + ['Horizontal compression'] + label is: + ['horizontal compression'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:55,826 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:55,826 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:55,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:55,827 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:55,827 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:56,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:56,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:56,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:56,838 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0109782218933105 s; generated tokens: 3 tokens; generate speed: 2.967422972160317 tokens/s +2024-07-30 14:07:56,843 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:56,843 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[923/2067], cost time 1.0221s, every example cost time is 1.0221, generate speed: 2.9352 tokens/s, avg speed: 10.3761 tokens/s, remaining time: 0:26:06 +pred is: + ['True'] + label is: + ['Extension'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:07:56,925 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:56,925 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:56,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:56,926 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:56,926 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:57,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:57,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:57,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:57,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:57,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.042304515838623 s; generated tokens: 4 tokens; generate speed: 3.837650071756293 tokens/s +2024-07-30 14:07:57,973 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:57,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[924/2067], cost time 1.0533s, every example cost time is 1.0533, generate speed: 3.7975 tokens/s, avg speed: 10.3707 tokens/s, remaining time: 0:26:05 +pred is: + ['Dikes'] + label is: + ['Dikes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:58,060 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:58,061 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 308, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:58,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:58,061 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:58,062 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:07:59,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2022783756256104 s; generated tokens: 9 tokens; generate speed: 7.485787137539435 tokens/s +2024-07-30 14:07:59,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:07:59,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[925/2067], cost time 1.2137s, every example cost time is 1.2137, generate speed: 7.4151 tokens/s, avg speed: 10.3678 tokens/s, remaining time: 0:26:03 +pred is: + ['layered basaltic lava flows'] + label is: + ['layered basaltic lava flows'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:07:59,352 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:07:59,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:07:59,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:07:59,353 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:07:59,353 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:00,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,879 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5255446434020996 s; generated tokens: 19 tokens; generate speed: 12.454568328874544 tokens/s +2024-07-30 14:08:00,883 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:00,884 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[926/2067], cost time 1.5368s, every example cost time is 1.5368, generate speed: 12.3634 tokens/s, avg speed: 10.3702 tokens/s, remaining time: 0:26:02 +pred is: + ['The study of rocks'] + label is: + ['the study of rocks'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:00,967 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:00,967 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:00,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:00,967 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:00,968 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:01,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:01,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:01,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,501 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.533064365386963 s; generated tokens: 20 tokens; generate speed: 13.04576666939341 tokens/s +2024-07-30 14:08:02,506 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:02,506 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[927/2067], cost time 1.5442s, every example cost time is 1.5442, generate speed: 12.9517 tokens/s, avg speed: 10.3734 tokens/s, remaining time: 0:26:01 +pred is: + ['1'] + label is: + ['identifying rocks'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:02,588 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:02,589 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:02,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:02,589 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:02,589 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:03,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:03,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:04,121 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5315155982971191 s; generated tokens: 20 tokens; generate speed: 13.05895938783637 tokens/s +2024-07-30 14:08:04,126 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:04,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[928/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9651 tokens/s, avg speed: 10.3765 tokens/s, remaining time: 0:26:00 +pred is: + ['1'] + label is: + ['pressure physical experiments'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:04,209 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:04,209 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:04,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:04,210 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:04,210 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:05,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,739 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528763771057129 s; generated tokens: 20 tokens; generate speed: 13.082465962789103 tokens/s +2024-07-30 14:08:05,744 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:05,744 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[929/2067], cost time 1.5399s, every example cost time is 1.5399, generate speed: 12.9880 tokens/s, avg speed: 10.3797 tokens/s, remaining time: 0:25:58 +pred is: + ['1'] + label is: + ['Structural geologists'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:05,851 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:05,851 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:05,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:05,852 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:05,852 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:06,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:06,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:07,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:07,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:07,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:07,385 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5322754383087158 s; generated tokens: 20 tokens; generate speed: 13.052483580938594 tokens/s +2024-07-30 14:08:07,389 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:07,390 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[930/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9550 tokens/s, avg speed: 10.3828 tokens/s, remaining time: 0:25:57 +pred is: + ['orogenic wedges'] + label is: + ['orogenic wedges'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 61.70271146378115, Em score: 47.634408602150536, current_count: 930 +2024-07-30 14:08:07,742 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:07,742 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:07,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:07,743 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:07,743 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:08,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:08,929 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1857500076293945 s; generated tokens: 8 tokens; generate speed: 6.746784691989136 tokens/s +2024-07-30 14:08:08,934 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:08,934 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[931/2067], cost time 1.1970s, every example cost time is 1.1970, generate speed: 6.6835 tokens/s, avg speed: 10.3793 tokens/s, remaining time: 0:25:56 +pred is: + ['1'] + label is: + ['stratigraphers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:09,016 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:09,016 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:09,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:09,017 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:09,017 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:09,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:09,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,418 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4010405540466309 s; generated tokens: 15 tokens; generate speed: 10.70632820490131 tokens/s +2024-07-30 14:08:10,423 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:10,423 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[932/2067], cost time 1.4122s, every example cost time is 1.4122, generate speed: 10.6220 tokens/s, avg speed: 10.3796 tokens/s, remaining time: 0:25:54 +pred is: + ['To provide better absolute bounds on the timing and rates of deposition.'] + label is: + ['provide better absolute bounds on the timing and rates of deposition'] +The F1/Em of this example is: {'F1': 93.33333333333333, 'Em': 0.0} +2024-07-30 14:08:10,506 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:10,506 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 286, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:10,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:10,507 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:10,507 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:11,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:11,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:11,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:11,520 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0122296810150146 s; generated tokens: 3 tokens; generate speed: 2.9637542311461824 tokens/s +2024-07-30 14:08:11,524 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:11,525 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[933/2067], cost time 1.0232s, every example cost time is 1.0232, generate speed: 2.9318 tokens/s, avg speed: 10.3736 tokens/s, remaining time: 0:25:53 +pred is: + ['1'] + label is: + ['Persia'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:11,607 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:11,607 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:11,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:11,608 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:11,608 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:12,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,879 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2707045078277588 s; generated tokens: 11 tokens; generate speed: 8.656615233705478 tokens/s +2024-07-30 14:08:12,883 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:12,884 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[934/2067], cost time 1.2819s, every example cost time is 1.2819, generate speed: 8.5810 tokens/s, avg speed: 10.3718 tokens/s, remaining time: 0:25:51 +pred is: + ['James Hutton'] + label is: + ['James Hutton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:12,966 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:12,966 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:12,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:12,967 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:12,967 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:13,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:13,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:13,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:14,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:14,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:14,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:14,071 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1041738986968994 s; generated tokens: 6 tokens; generate speed: 5.433926673217827 tokens/s +2024-07-30 14:08:14,076 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:14,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[935/2067], cost time 1.1153s, every example cost time is 1.1153, generate speed: 5.3798 tokens/s, avg speed: 10.3675 tokens/s, remaining time: 0:25:49 +pred is: + ['William Maclure'] + label is: + ['William Maclure'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:14,158 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:14,158 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:14,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:14,159 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:14,159 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:15,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,716 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5564985275268555 s; generated tokens: 20 tokens; generate speed: 12.84935362693745 tokens/s +2024-07-30 14:08:15,720 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:15,721 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[936/2067], cost time 1.5677s, every example cost time is 1.5677, generate speed: 12.7574 tokens/s, avg speed: 10.3704 tokens/s, remaining time: 0:25:48 +pred is: + ['Principles of Geology'] + label is: + ['Principles of Geology'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:15,803 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:15,803 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 293, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:15,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:15,804 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:15,804 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:16,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:16,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:17,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:17,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:17,036 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.232001781463623 s; generated tokens: 10 tokens; generate speed: 8.116871379942292 tokens/s +2024-07-30 14:08:17,041 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:17,041 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[937/2067], cost time 1.2431s, every example cost time is 1.2431, generate speed: 8.0442 tokens/s, avg speed: 10.3682 tokens/s, remaining time: 0:25:47 +pred is: + ['103'] + label is: + ['103 miles'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:08:17,123 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:17,123 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:17,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:17,124 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:17,124 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:18,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,683 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5591444969177246 s; generated tokens: 20 tokens; generate speed: 12.827547439982654 tokens/s +2024-07-30 14:08:18,688 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:18,689 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[938/2067], cost time 1.5704s, every example cost time is 1.5704, generate speed: 12.7359 tokens/s, avg speed: 10.3711 tokens/s, remaining time: 0:25:46 +pred is: + ['Robert Curthose'] + label is: + ['Robert Curthose'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:18,771 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:18,771 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 276, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:18,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:18,772 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:18,772 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:19,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:19,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:20,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:20,314 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5419855117797852 s; generated tokens: 20 tokens; generate speed: 12.97029047757762 tokens/s +2024-07-30 14:08:20,319 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:20,319 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[939/2067], cost time 1.5532s, every example cost time is 1.5532, generate speed: 12.8763 tokens/s, avg speed: 10.3741 tokens/s, remaining time: 0:25:45 +pred is: + ['Pons Aelius'] + label is: + ['Pons Aelius'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:20,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:20,427 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:20,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:20,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:20,428 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:21,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:21,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:21,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:21,439 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011240005493164 s; generated tokens: 3 tokens; generate speed: 2.9666547839322797 tokens/s +2024-07-30 14:08:21,444 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:21,444 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[940/2067], cost time 1.0228s, every example cost time is 1.0228, generate speed: 2.9332 tokens/s, avg speed: 10.3682 tokens/s, remaining time: 0:25:43 +pred is: + ['England'] + label is: + ["England's"] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 61.783888292180634, Em score: 47.659574468085104, current_count: 940 +2024-07-30 14:08:21,798 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:21,798 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:21,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:21,799 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:21,799 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:22,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:22,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:22,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:22,809 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0098598003387451 s; generated tokens: 3 tokens; generate speed: 2.970709398466685 tokens/s +2024-07-30 14:08:22,814 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:22,814 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[941/2067], cost time 1.0213s, every example cost time is 1.0213, generate speed: 2.9376 tokens/s, avg speed: 10.3623 tokens/s, remaining time: 0:25:41 +pred is: + ['coal'] + label is: + ['coal'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:22,895 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:22,896 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:22,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:22,896 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:22,897 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:23,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:23,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:23,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:23,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:23,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:23,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,432 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354304313659668 s; generated tokens: 20 tokens; generate speed: 13.025663417526104 tokens/s +2024-07-30 14:08:24,437 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:24,437 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[942/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9308 tokens/s, avg speed: 10.3654 tokens/s, remaining time: 0:25:40 +pred is: + ['1'] + label is: + ['their families'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:08:24,520 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:24,521 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:24,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:24,521 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:24,522 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:25,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:25,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:25,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:25,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:25,564 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0421748161315918 s; generated tokens: 4 tokens; generate speed: 3.8381276711784733 tokens/s +2024-07-30 14:08:25,569 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:25,569 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[943/2067], cost time 1.0537s, every example cost time is 1.0537, generate speed: 3.7960 tokens/s, avg speed: 10.3600 tokens/s, remaining time: 0:25:38 +pred is: + ['The King'] + label is: + ['the King'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:25,651 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:25,651 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 303, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:25,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:25,652 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:25,652 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:26,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:26,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:27,161 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5087907314300537 s; generated tokens: 19 tokens; generate speed: 12.592866329442204 tokens/s +2024-07-30 14:08:27,166 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:27,166 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[944/2067], cost time 1.5201s, every example cost time is 1.5201, generate speed: 12.4995 tokens/s, avg speed: 10.3625 tokens/s, remaining time: 0:25:37 +pred is: + ['Urbanization'] + label is: + ['urbanization'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:27,249 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:27,250 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:27,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:27,251 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:27,251 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:28,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:28,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:28,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:28,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:28,319 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.068052053451538 s; generated tokens: 4 tokens; generate speed: 3.7451358171856146 tokens/s +2024-07-30 14:08:28,324 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:28,324 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[945/2067], cost time 1.0797s, every example cost time is 1.0797, generate speed: 3.7047 tokens/s, avg speed: 10.3570 tokens/s, remaining time: 0:25:35 +pred is: + ['Medieval'] + label is: + ['medieval'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:28,406 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:28,406 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:28,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:28,407 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:28,407 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:29,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:29,959 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5524303913116455 s; generated tokens: 20 tokens; generate speed: 12.883025295003428 tokens/s +2024-07-30 14:08:29,964 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:29,965 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[946/2067], cost time 1.5638s, every example cost time is 1.5638, generate speed: 12.7895 tokens/s, avg speed: 10.3599 tokens/s, remaining time: 0:25:34 +pred is: + ['The city has an extensive neoclassical centre referred to as Tyneside Classical largely developed'] + label is: + ['Tyneside Classical'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:08:30,071 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:30,071 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:30,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:30,072 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:30,072 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:31,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:31,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:31,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:31,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:31,114 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0422537326812744 s; generated tokens: 4 tokens; generate speed: 3.837837058841426 tokens/s +2024-07-30 14:08:31,119 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:31,119 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[947/2067], cost time 1.0539s, every example cost time is 1.0539, generate speed: 3.7953 tokens/s, avg speed: 10.3546 tokens/s, remaining time: 0:25:32 +pred is: + ['Town Moor'] + label is: + ['Town Moor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:31,202 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:31,202 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:31,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:31,203 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:31,203 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:32,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,340 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1370434761047363 s; generated tokens: 7 tokens; generate speed: 6.156316928162218 tokens/s +2024-07-30 14:08:32,345 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:32,345 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[948/2067], cost time 1.1483s, every example cost time is 1.1483, generate speed: 6.0959 tokens/s, avg speed: 10.3508 tokens/s, remaining time: 0:25:31 +pred is: + ['imposing new office developments'] + label is: + ['Large-scale regeneration'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:08:32,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:32,428 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:32,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:32,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:32,429 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:33,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:33,963 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338761806488037 s; generated tokens: 20 tokens; generate speed: 13.038862101333589 tokens/s +2024-07-30 14:08:33,967 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:33,968 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[949/2067], cost time 1.5452s, every example cost time is 1.5452, generate speed: 12.9429 tokens/s, avg speed: 10.3539 tokens/s, remaining time: 0:25:30 +pred is: + ['Grainger Town'] + label is: + ['the Grainger Town area'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:08:34,049 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:34,049 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:34,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:34,050 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:34,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:34,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,123 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0720443725585938 s; generated tokens: 5 tokens; generate speed: 4.663986051311248 tokens/s +2024-07-30 14:08:35,127 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:35,128 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[950/2067], cost time 1.0833s, every example cost time is 1.0833, generate speed: 4.6156 tokens/s, avg speed: 10.3491 tokens/s, remaining time: 0:25:28 +pred is: + ['Butcher Market'] + label is: + ['the Butcher Market'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 61.844057889105066, Em score: 47.68421052631579, current_count: 950 +2024-07-30 14:08:35,494 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:35,495 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:35,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:35,495 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:35,496 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:36,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:36,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:36,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:36,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:36,536 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0398979187011719 s; generated tokens: 4 tokens; generate speed: 3.8465314028092132 tokens/s +2024-07-30 14:08:36,540 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:36,541 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[951/2067], cost time 1.0514s, every example cost time is 1.0514, generate speed: 3.8046 tokens/s, avg speed: 10.3438 tokens/s, remaining time: 0:25:26 +pred is: + ['Oceanic'] + label is: + ['oceanic'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:36,622 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:36,623 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 310, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:36,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:36,623 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:36,624 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:37,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:37,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:38,167 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5426387786865234 s; generated tokens: 20 tokens; generate speed: 12.964797901054295 tokens/s +2024-07-30 14:08:38,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:38,172 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[952/2067], cost time 1.5540s, every example cost time is 1.5540, generate speed: 12.8702 tokens/s, avg speed: 10.3468 tokens/s, remaining time: 0:25:25 +pred is: + ['2010'] + label is: + ['2010'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:38,265 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:38,265 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:38,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:38,266 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:38,266 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:39,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:39,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:39,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:39,277 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0105431079864502 s; generated tokens: 3 tokens; generate speed: 2.9687006682749306 tokens/s +2024-07-30 14:08:39,281 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:39,282 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[953/2067], cost time 1.0221s, every example cost time is 1.0221, generate speed: 2.9351 tokens/s, avg speed: 10.3410 tokens/s, remaining time: 0:25:23 +pred is: + ['Shopping'] + label is: + ['shopping'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:39,363 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:39,363 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:39,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:39,364 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:39,364 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:40,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,900 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5358374118804932 s; generated tokens: 20 tokens; generate speed: 13.02221175580807 tokens/s +2024-07-30 14:08:40,905 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:40,905 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[954/2067], cost time 1.5469s, every example cost time is 1.5469, generate speed: 12.9288 tokens/s, avg speed: 10.3441 tokens/s, remaining time: 0:25:22 +pred is: + ['Tyneside flats'] + label is: + ['The Tyneside flat'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:08:40,988 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:40,988 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:40,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:40,989 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:40,989 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:41,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:41,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:41,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:42,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:42,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:42,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:42,099 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1095504760742188 s; generated tokens: 6 tokens; generate speed: 5.407595354498009 tokens/s +2024-07-30 14:08:42,104 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:42,104 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[955/2067], cost time 1.1207s, every example cost time is 1.1207, generate speed: 5.3539 tokens/s, avg speed: 10.3398 tokens/s, remaining time: 0:25:20 +pred is: + ['7.8%'] + label is: + ['7.8%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:42,186 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:42,187 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 286, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:42,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:42,187 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:42,188 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:43,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2602565288543701 s; generated tokens: 11 tokens; generate speed: 8.728381681148278 tokens/s +2024-07-30 14:08:43,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:43,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[956/2067], cost time 1.2713s, every example cost time is 1.2713, generate speed: 8.6524 tokens/s, avg speed: 10.3381 tokens/s, remaining time: 0:25:19 +pred is: + ['2001'] + label is: + ['2001'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:43,535 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:43,535 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:43,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:43,535 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:43,536 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:44,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,608 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0722780227661133 s; generated tokens: 5 tokens; generate speed: 4.662969765156332 tokens/s +2024-07-30 14:08:44,613 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:44,613 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[957/2067], cost time 1.0834s, every example cost time is 1.0834, generate speed: 4.6152 tokens/s, avg speed: 10.3334 tokens/s, remaining time: 0:25:17 +pred is: + ['37.8'] + label is: + ['37.8'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:44,694 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:44,695 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:44,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:44,695 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:44,696 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:45,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:45,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:46,233 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5371320247650146 s; generated tokens: 20 tokens; generate speed: 13.011244107712512 tokens/s +2024-07-30 14:08:46,238 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:46,238 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[958/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9168 tokens/s, avg speed: 10.3365 tokens/s, remaining time: 0:25:16 +pred is: + ['Geordie'] + label is: + ['Geordie'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:46,321 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:46,321 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:46,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:46,322 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:46,322 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:47,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,396 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0738935470581055 s; generated tokens: 5 tokens; generate speed: 4.655954972163981 tokens/s +2024-07-30 14:08:47,401 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:47,401 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[959/2067], cost time 1.0851s, every example cost time is 1.0851, generate speed: 4.6078 tokens/s, avg speed: 10.3317 tokens/s, remaining time: 0:25:14 +pred is: + ['Scandinavia'] + label is: + ['Scandinavia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:47,483 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:47,483 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:47,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:47,484 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:47,484 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:48,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:48,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:49,025 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5407066345214844 s; generated tokens: 20 tokens; generate speed: 12.98105658265802 tokens/s +2024-07-30 14:08:49,030 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:49,030 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[960/2067], cost time 1.5519s, every example cost time is 1.5519, generate speed: 12.8876 tokens/s, avg speed: 10.3347 tokens/s, remaining time: 0:25:13 +pred is: + ['1'] + label is: + ['a report'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.085265619426885, Em score: 48.020833333333336, current_count: 960 +2024-07-30 14:08:49,389 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:49,389 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:49,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:49,390 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:49,391 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:50,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:50,930 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390267372131348 s; generated tokens: 20 tokens; generate speed: 12.99522582448174 tokens/s +2024-07-30 14:08:50,935 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:50,935 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[961/2067], cost time 1.5508s, every example cost time is 1.5508, generate speed: 12.8969 tokens/s, avg speed: 10.3378 tokens/s, remaining time: 0:25:12 +pred is: + ['Collingwood Street'] + label is: + ['Collingwood Street'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:51,017 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:51,017 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:51,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:51,018 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:51,018 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:51,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:51,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:52,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:52,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:52,059 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0408520698547363 s; generated tokens: 4 tokens; generate speed: 3.8430052798552334 tokens/s +2024-07-30 14:08:52,064 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:52,064 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[962/2067], cost time 1.0520s, every example cost time is 1.0520, generate speed: 3.8022 tokens/s, avg speed: 10.3325 tokens/s, remaining time: 0:25:10 +pred is: + ['Theatre'] + label is: + ['theatre'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:52,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:52,146 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:52,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:52,147 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:52,147 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:53,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,223 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0764484405517578 s; generated tokens: 5 tokens; generate speed: 4.644904309060207 tokens/s +2024-07-30 14:08:53,229 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:53,229 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[963/2067], cost time 1.0882s, every example cost time is 1.0882, generate speed: 4.5947 tokens/s, avg speed: 10.3278 tokens/s, remaining time: 0:25:09 +pred is: + ['Theatres'] + label is: + ['theatres'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:53,312 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:53,312 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:53,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:53,313 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:53,313 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:54,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,857 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5432617664337158 s; generated tokens: 20 tokens; generate speed: 12.959564239200644 tokens/s +2024-07-30 14:08:54,861 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:54,862 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[964/2067], cost time 1.5546s, every example cost time is 1.5546, generate speed: 12.8648 tokens/s, avg speed: 10.3308 tokens/s, remaining time: 0:25:07 +pred is: + ["The Literary and Philosophical Society of Newcastle upon Tyne (popularly known as the 'Lit"] + label is: + ['The Literary and Philosophical Society of Newcastle'] +The F1/Em of this example is: {'F1': 61.904761904761905, 'Em': 0.0} +2024-07-30 14:08:54,945 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:54,946 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:54,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:54,946 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:54,946 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:55,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:55,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:55,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:55,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,487 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402874946594238 s; generated tokens: 20 tokens; generate speed: 12.984588961051223 tokens/s +2024-07-30 14:08:56,492 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:56,492 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[965/2067], cost time 1.5515s, every example cost time is 1.5515, generate speed: 12.8911 tokens/s, avg speed: 10.3338 tokens/s, remaining time: 0:25:06 +pred is: + ['Newcastle Beer Festival'] + label is: + ['The Newcastle Beer Festival'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:08:56,578 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:56,578 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:56,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:56,579 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:56,579 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:57,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:57,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:58,122 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5427420139312744 s; generated tokens: 20 tokens; generate speed: 12.963930339224529 tokens/s +2024-07-30 14:08:58,127 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:58,127 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[966/2067], cost time 1.5554s, every example cost time is 1.5554, generate speed: 12.8580 tokens/s, avg speed: 10.3368 tokens/s, remaining time: 0:25:05 +pred is: + ['The Hoppings'] + label is: + ['The Hoppings'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:58,209 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:58,209 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:58,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:58,210 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:58,210 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:08:59,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,406 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1951613426208496 s; generated tokens: 9 tokens; generate speed: 7.530364042953438 tokens/s +2024-07-30 14:08:59,410 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:08:59,411 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[967/2067], cost time 1.2062s, every example cost time is 1.2062, generate speed: 7.4613 tokens/s, avg speed: 10.3341 tokens/s, remaining time: 0:25:04 +pred is: + ['Newcastle Mela'] + label is: + ['Newcastle Mela'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:08:59,493 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:08:59,493 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:08:59,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:08:59,494 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:08:59,494 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:00,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:00,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:00,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:00,509 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0145893096923828 s; generated tokens: 3 tokens; generate speed: 2.9568614328388514 tokens/s +2024-07-30 14:09:00,514 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:00,514 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[968/2067], cost time 1.0257s, every example cost time is 1.0257, generate speed: 2.9248 tokens/s, avg speed: 10.3284 tokens/s, remaining time: 0:25:02 +pred is: + ['folk-rock'] + label is: + ['folk-rock'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:00,596 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:00,596 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:00,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:00,597 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:00,597 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:01,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:01,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:02,130 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532334804534912 s; generated tokens: 20 tokens; generate speed: 13.051977897265289 tokens/s +2024-07-30 14:09:02,134 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:02,135 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[969/2067], cost time 1.5435s, every example cost time is 1.5435, generate speed: 12.9577 tokens/s, avg speed: 10.3315 tokens/s, remaining time: 0:25:01 +pred is: + ['2006-2008'] + label is: + ['November 2006 and May 2008'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:02,218 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:02,218 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:02,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:02,219 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:02,219 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:03,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:03,752 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5330276489257812 s; generated tokens: 20 tokens; generate speed: 13.046079119325958 tokens/s +2024-07-30 14:09:03,757 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:03,757 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[970/2067], cost time 1.5444s, every example cost time is 1.5444, generate speed: 12.9504 tokens/s, avg speed: 10.3345 tokens/s, remaining time: 0:24:59 +pred is: + ['Centre for Life'] + label is: + ['Centre for Life'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.31659081431742, Em score: 48.24742268041237, current_count: 970 +2024-07-30 14:09:04,126 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:04,126 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:04,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:04,127 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:04,127 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:05,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,662 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534663438796997 s; generated tokens: 20 tokens; generate speed: 13.032173370649751 tokens/s +2024-07-30 14:09:05,667 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:05,667 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[971/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9347 tokens/s, avg speed: 10.3375 tokens/s, remaining time: 0:24:58 +pred is: + ['1939'] + label is: + ['On the Night of the Fire'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:05,750 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:05,750 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 248, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:05,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:05,751 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:05,751 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:06,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:06,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:07,073 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3216798305511475 s; generated tokens: 13 tokens; generate speed: 9.835967606904413 tokens/s +2024-07-30 14:09:07,078 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:07,078 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[972/2067], cost time 1.3330s, every example cost time is 1.3330, generate speed: 9.7526 tokens/s, avg speed: 10.3370 tokens/s, remaining time: 0:24:57 +pred is: + ['Gosforth Park'] + label is: + ['Gosforth Park'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:07,160 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:07,160 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:07,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:07,161 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:07,161 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:08,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:08,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:08,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:08,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:08,202 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0403149127960205 s; generated tokens: 4 tokens; generate speed: 3.8449895803659397 tokens/s +2024-07-30 14:09:08,206 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:08,207 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[973/2067], cost time 1.0515s, every example cost time is 1.0515, generate speed: 3.8041 tokens/s, avg speed: 10.3318 tokens/s, remaining time: 0:24:55 +pred is: + ['6 miles'] + label is: + ['6 miles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:08,289 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:08,289 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:08,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:08,290 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:08,290 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:09,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,363 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.072319507598877 s; generated tokens: 5 tokens; generate speed: 4.6627893688103565 tokens/s +2024-07-30 14:09:09,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:09,368 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[974/2067], cost time 1.0834s, every example cost time is 1.0834, generate speed: 4.6153 tokens/s, avg speed: 10.3271 tokens/s, remaining time: 0:24:54 +pred is: + ['The Victorian architecture'] + label is: + ['Victorian architecture'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:09:09,452 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:09,453 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:09,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:09,453 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:09,454 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:10,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,527 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.073134422302246 s; generated tokens: 5 tokens; generate speed: 4.659248549005877 tokens/s +2024-07-30 14:09:10,532 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:10,532 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[975/2067], cost time 1.0852s, every example cost time is 1.0852, generate speed: 4.6076 tokens/s, avg speed: 10.3225 tokens/s, remaining time: 0:24:52 +pred is: + ['half-hourly'] + label is: + ['half-hourly'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:10,614 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:10,614 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:10,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:10,615 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:10,615 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:11,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,781 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.166489839553833 s; generated tokens: 8 tokens; generate speed: 6.858182325068425 tokens/s +2024-07-30 14:09:11,786 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:11,786 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[976/2067], cost time 1.1776s, every example cost time is 1.1776, generate speed: 6.7933 tokens/s, avg speed: 10.3194 tokens/s, remaining time: 0:24:50 +pred is: + ['The Tyne and Wear Metro'] + label is: + ['Tyne and Wear Metro'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:09:11,869 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:11,869 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:11,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:11,870 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:11,870 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:12,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:12,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:12,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:12,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:12,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:12,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,134 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2641894817352295 s; generated tokens: 11 tokens; generate speed: 8.701227275599045 tokens/s +2024-07-30 14:09:13,139 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:13,139 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[977/2067], cost time 1.2753s, every example cost time is 1.2753, generate speed: 8.6251 tokens/s, avg speed: 10.3178 tokens/s, remaining time: 0:24:49 +pred is: + ['Metro: All Change'] + label is: + ["Metro: All Change.'"] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:09:13,221 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:13,221 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 283, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:13,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:13,222 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:13,222 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:14,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:14,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:14,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:14,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:14,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0416715145111084 s; generated tokens: 4 tokens; generate speed: 3.8399821289894205 tokens/s +2024-07-30 14:09:14,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:14,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[978/2067], cost time 1.0527s, every example cost time is 1.0527, generate speed: 3.7998 tokens/s, avg speed: 10.3126 tokens/s, remaining time: 0:24:47 +pred is: + ['A1'] + label is: + ['the A1'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:09:14,350 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:14,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:14,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:14,351 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:14,351 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:15,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:15,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:15,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:15,362 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.010606050491333 s; generated tokens: 3 tokens; generate speed: 2.9685157718395514 tokens/s +2024-07-30 14:09:15,367 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:15,367 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[979/2067], cost time 1.0216s, every example cost time is 1.0216, generate speed: 2.9365 tokens/s, avg speed: 10.3070 tokens/s, remaining time: 0:24:45 +pred is: + ['3'] + label is: + ['3'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:15,449 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:15,450 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:15,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:15,450 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:15,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:16,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:16,711 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2599856853485107 s; generated tokens: 11 tokens; generate speed: 8.730257913174157 tokens/s +2024-07-30 14:09:16,715 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:16,716 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[980/2067], cost time 1.2712s, every example cost time is 1.2712, generate speed: 8.6536 tokens/s, avg speed: 10.3054 tokens/s, remaining time: 0:24:44 +pred is: + ['1998'] + label is: + ['1998'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.492782064511466, Em score: 48.265306122448976, current_count: 980 +2024-07-30 14:09:17,079 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:17,080 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:17,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:17,080 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:17,080 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:18,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,617 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5364024639129639 s; generated tokens: 20 tokens; generate speed: 13.01742249818013 tokens/s +2024-07-30 14:09:18,622 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:18,622 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[981/2067], cost time 1.5478s, every example cost time is 1.5478, generate speed: 12.9213 tokens/s, avg speed: 10.3084 tokens/s, remaining time: 0:24:43 +pred is: + ['1'] + label is: + ['Danish DFDS Seaways'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:18,704 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:18,705 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:18,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:18,705 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:18,706 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:19,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:19,948 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2423381805419922 s; generated tokens: 10 tokens; generate speed: 8.049338059977616 tokens/s +2024-07-30 14:09:19,953 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:19,953 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[982/2067], cost time 1.2535s, every example cost time is 1.2535, generate speed: 7.9776 tokens/s, avg speed: 10.3063 tokens/s, remaining time: 0:24:41 +pred is: + ['11'] + label is: + ['eleven'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:20,036 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:20,036 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:20,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:20,037 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:20,037 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:20,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,581 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5433099269866943 s; generated tokens: 20 tokens; generate speed: 12.959159822842524 tokens/s +2024-07-30 14:09:21,586 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:21,586 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[983/2067], cost time 1.5546s, every example cost time is 1.5546, generate speed: 12.8650 tokens/s, avg speed: 10.3092 tokens/s, remaining time: 0:24:40 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:21,669 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:21,669 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:21,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:21,670 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:21,670 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:22,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:22,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:22,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:22,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.008882761001587 s; generated tokens: 3 tokens; generate speed: 2.9735863431958087 tokens/s +2024-07-30 14:09:22,684 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:22,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[984/2067], cost time 1.0202s, every example cost time is 1.0202, generate speed: 2.9406 tokens/s, avg speed: 10.3036 tokens/s, remaining time: 0:24:38 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:22,766 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:22,766 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:22,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:22,767 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:22,767 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:23,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:23,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:24,305 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378594398498535 s; generated tokens: 20 tokens; generate speed: 13.00508972520445 tokens/s +2024-07-30 14:09:24,309 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:24,310 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[985/2067], cost time 1.5491s, every example cost time is 1.5491, generate speed: 12.9111 tokens/s, avg speed: 10.3066 tokens/s, remaining time: 0:24:37 +pred is: + ['The Parish Church of St Andrew'] + label is: + ['The Parish Church of St Andrew'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:24,392 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:24,393 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:24,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:24,393 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:24,393 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:25,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:25,926 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532548427581787 s; generated tokens: 20 tokens; generate speed: 13.05015857251445 tokens/s +2024-07-30 14:09:25,931 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:25,931 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[986/2067], cost time 1.5439s, every example cost time is 1.5439, generate speed: 12.9539 tokens/s, avg speed: 10.3097 tokens/s, remaining time: 0:24:36 +pred is: + ['1'] + label is: + ['City Road'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:26,013 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:26,014 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:26,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:26,014 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:26,015 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:26,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:26,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:27,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:27,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:27,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:27,086 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0711820125579834 s; generated tokens: 5 tokens; generate speed: 4.667740814709908 tokens/s +2024-07-30 14:09:27,091 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:27,091 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[987/2067], cost time 1.0824s, every example cost time is 1.0824, generate speed: 4.6196 tokens/s, avg speed: 10.3051 tokens/s, remaining time: 0:24:34 +pred is: + ['NE1fm'] + label is: + ['NE1fm'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:27,174 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:27,174 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:27,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:27,175 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:27,175 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:28,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,711 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5361485481262207 s; generated tokens: 20 tokens; generate speed: 13.019574197037004 tokens/s +2024-07-30 14:09:28,716 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:28,717 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[988/2067], cost time 1.5479s, every example cost time is 1.5479, generate speed: 12.9204 tokens/s, avg speed: 10.3081 tokens/s, remaining time: 0:24:33 +pred is: + ['1770'] + label is: + ['1770'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:28,799 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:28,799 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:28,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:28,800 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:28,800 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:29,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,903 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1033520698547363 s; generated tokens: 6 tokens; generate speed: 5.437974118986282 tokens/s +2024-07-30 14:09:29,908 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:29,908 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[989/2067], cost time 1.1146s, every example cost time is 1.1146, generate speed: 5.3832 tokens/s, avg speed: 10.3040 tokens/s, remaining time: 0:24:31 +pred is: + ['Rutherford Grammar School'] + label is: + ['Rutherford Grammar School'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:29,991 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:29,991 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:29,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:29,992 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:29,992 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:30,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:30,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,527 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5350072383880615 s; generated tokens: 20 tokens; generate speed: 13.029254520651223 tokens/s +2024-07-30 14:09:31,532 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:31,532 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[990/2067], cost time 1.5462s, every example cost time is 1.5462, generate speed: 12.9348 tokens/s, avg speed: 10.3070 tokens/s, remaining time: 0:24:30 +pred is: + ['in the Brompton district of the Royal Borough of Kensington and Chelsea'] + label is: + ['The V&A is located in the Brompton district of the Royal Borough of Kensington and Chelsea'] +The F1/Em of this example is: {'F1': 82.14285714285715, 'Em': 0.0} +F1 score: 62.348554828650606, Em score: 48.18181818181818, current_count: 990 +2024-07-30 14:09:31,909 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:31,909 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:31,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:31,910 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:31,910 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:32,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:32,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:32,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:32,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:32,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,447 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5366017818450928 s; generated tokens: 20 tokens; generate speed: 13.015733963281471 tokens/s +2024-07-30 14:09:33,452 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:33,452 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[991/2067], cost time 1.5482s, every example cost time is 1.5482, generate speed: 12.9186 tokens/s, avg speed: 10.3100 tokens/s, remaining time: 0:24:29 +pred is: + ['12.5'] + label is: + ['12.5'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:33,534 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:33,534 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:33,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:33,535 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:33,535 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:34,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:34,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:35,072 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5363540649414062 s; generated tokens: 20 tokens; generate speed: 13.017832579342812 tokens/s +2024-07-30 14:09:35,076 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:35,077 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[992/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9228 tokens/s, avg speed: 10.3130 tokens/s, remaining time: 0:24:28 +pred is: + ['The Great Exhibition of 1851'] + label is: + ['Great Exhibition of 1851'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:09:35,159 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:35,159 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 307, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:35,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:35,160 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:35,160 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:36,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,701 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5403187274932861 s; generated tokens: 20 tokens; generate speed: 12.984325674302479 tokens/s +2024-07-30 14:09:36,706 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:36,706 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[993/2067], cost time 1.5515s, every example cost time is 1.5515, generate speed: 12.8904 tokens/s, avg speed: 10.3160 tokens/s, remaining time: 0:24:27 +pred is: + ['Queen Victoria'] + label is: + ['Queen Victoria'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:36,788 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:36,788 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:36,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:36,789 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:36,789 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:37,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:37,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:38,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:38,323 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.533613681793213 s; generated tokens: 20 tokens; generate speed: 13.04109388005364 tokens/s +2024-07-30 14:09:38,328 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:38,328 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[994/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9470 tokens/s, avg speed: 10.3189 tokens/s, remaining time: 0:24:26 +pred is: + ['September 1946'] + label is: + ['between September and November 1946'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:09:38,411 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:38,411 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:38,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:38,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:38,412 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:39,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:39,954 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5420334339141846 s; generated tokens: 20 tokens; generate speed: 12.969887396820877 tokens/s +2024-07-30 14:09:39,959 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:39,959 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[995/2067], cost time 1.5534s, every example cost time is 1.5534, generate speed: 12.8750 tokens/s, avg speed: 10.3219 tokens/s, remaining time: 0:24:24 +pred is: + ['a rock concert'] + label is: + ['a rock concert'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:40,041 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:40,042 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:40,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:40,042 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:40,042 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:40,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,114 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071012020111084 s; generated tokens: 5 tokens; generate speed: 4.668481684716673 tokens/s +2024-07-30 14:09:41,118 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:41,119 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[996/2067], cost time 1.0822s, every example cost time is 1.0822, generate speed: 4.6203 tokens/s, avg speed: 10.3173 tokens/s, remaining time: 0:24:23 +pred is: + ['Dundee'] + label is: + ['Dundee'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:41,202 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:41,202 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 345, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:41,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:41,203 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:41,203 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:42,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5397226810455322 s; generated tokens: 20 tokens; generate speed: 12.98935207372487 tokens/s +2024-07-30 14:09:42,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:42,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[997/2067], cost time 1.5511s, every example cost time is 1.5511, generate speed: 12.8938 tokens/s, avg speed: 10.3203 tokens/s, remaining time: 0:24:22 +pred is: + ['Brompton Park House'] + label is: + ['Brompton Park House'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:42,830 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:42,830 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 501, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:42,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:42,831 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:42,831 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:43,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,908 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0768308639526367 s; generated tokens: 5 tokens; generate speed: 4.643254727717314 tokens/s +2024-07-30 14:09:43,913 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:43,913 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[998/2067], cost time 1.0879s, every example cost time is 1.0879, generate speed: 4.5959 tokens/s, avg speed: 10.3157 tokens/s, remaining time: 0:24:20 +pred is: + ['Owen Jones'] + label is: + ['Oriental Courts'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:09:43,994 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:43,994 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 323, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:43,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:43,995 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:43,995 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:44,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:44,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,532 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5365359783172607 s; generated tokens: 20 tokens; generate speed: 13.016291373732116 tokens/s +2024-07-30 14:09:45,537 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:45,537 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[999/2067], cost time 1.5478s, every example cost time is 1.5478, generate speed: 12.9218 tokens/s, avg speed: 10.3187 tokens/s, remaining time: 0:24:19 +pred is: + ['Philip Webb and William Morris'] + label is: + ['Philip Webb and William Morris'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:45,620 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:45,620 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:45,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:45,621 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:45,621 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:46,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:46,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:47,032 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4109320640563965 s; generated tokens: 16 tokens; generate speed: 11.34002154150525 tokens/s +2024-07-30 14:09:47,037 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:47,037 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1000/2067], cost time 1.4222s, every example cost time is 1.4222, generate speed: 11.2498 tokens/s, avg speed: 10.3196 tokens/s, remaining time: 0:24:17 +pred is: + ['Colonel (later Major General) Henry Young Darracott Scott'] + label is: + ['Henry Young Darracott Scott'] +The F1/Em of this example is: {'F1': 58.333333333333336, 'Em': 0.0} +F1 score: 62.53756928036411, Em score: 48.3, current_count: 1000 +2024-07-30 14:09:47,408 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:47,408 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 358, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:47,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:47,409 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:47,409 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:48,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,677 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.268362045288086 s; generated tokens: 11 tokens; generate speed: 8.672602622306902 tokens/s +2024-07-30 14:09:48,682 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:48,682 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1001/2067], cost time 1.2796s, every example cost time is 1.2796, generate speed: 8.5965 tokens/s, avg speed: 10.3180 tokens/s, remaining time: 0:24:16 +pred is: + ['Sgraffito'] + label is: + ['sgraffito'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:48,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:48,765 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:48,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:48,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:48,766 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:49,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:49,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:50,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:50,330 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5632848739624023 s; generated tokens: 20 tokens; generate speed: 12.793573540634801 tokens/s +2024-07-30 14:09:50,334 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:50,335 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1002/2067], cost time 1.5745s, every example cost time is 1.5745, generate speed: 12.7021 tokens/s, avg speed: 10.3207 tokens/s, remaining time: 0:24:15 +pred is: + ['Aston Webb'] + label is: + ['Aston Webb'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:50,417 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:50,418 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:50,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:50,418 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:50,419 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:51,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:51,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:51,402 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9829874038696289 s; generated tokens: 2 tokens; generate speed: 2.0346140674100184 tokens/s +2024-07-30 14:09:51,407 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:51,407 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1003/2067], cost time 0.9943s, every example cost time is 0.9943, generate speed: 2.0114 tokens/s, avg speed: 10.3147 tokens/s, remaining time: 0:24:13 +pred is: + ['A'] + label is: + ['Alfred Drury'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:09:51,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:51,490 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 338, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:51,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:51,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:51,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:52,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:52,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:53,041 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.549483060836792 s; generated tokens: 20 tokens; generate speed: 12.907530585845244 tokens/s +2024-07-30 14:09:53,045 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:53,046 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1004/2067], cost time 1.5609s, every example cost time is 1.5609, generate speed: 12.8133 tokens/s, avg speed: 10.3176 tokens/s, remaining time: 0:24:12 +pred is: + ['The Art Library'] + label is: + ['Art Library'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:09:53,128 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:53,129 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 470, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:53,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:53,129 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:53,130 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:54,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,681 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.55088210105896 s; generated tokens: 20 tokens; generate speed: 12.89588679006855 tokens/s +2024-07-30 14:09:54,686 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:54,686 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1005/2067], cost time 1.5621s, every example cost time is 1.5621, generate speed: 12.8031 tokens/s, avg speed: 10.3204 tokens/s, remaining time: 0:24:11 +pred is: + ['The main silverware gallery'] + label is: + ['main silverware gallery'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:09:54,769 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:54,769 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:54,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:54,770 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:54,770 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:55,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:55,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:56,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:56,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5513970851898193 s; generated tokens: 20 tokens; generate speed: 12.891606018167119 tokens/s +2024-07-30 14:09:56,327 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:56,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1006/2067], cost time 1.5627s, every example cost time is 1.5627, generate speed: 12.7987 tokens/s, avg speed: 10.3232 tokens/s, remaining time: 0:24:10 +pred is: + ['Kim Wilkie'] + label is: + ['Kim Wilkie'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:56,409 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:56,409 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:56,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:56,410 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:56,410 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:57,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:57,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354278087615967 s; generated tokens: 20 tokens; generate speed: 13.025685666153887 tokens/s +2024-07-30 14:09:57,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:57,951 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1007/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9308 tokens/s, avg speed: 10.3261 tokens/s, remaining time: 0:24:08 +pred is: + ['2004'] + label is: + ['2004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:09:58,034 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:58,034 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:58,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:58,035 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:58,035 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:09:58,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,584 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5487570762634277 s; generated tokens: 20 tokens; generate speed: 12.91358102992661 tokens/s +2024-07-30 14:09:59,589 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:09:59,589 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1008/2067], cost time 1.5601s, every example cost time is 1.5601, generate speed: 12.8201 tokens/s, avg speed: 10.3290 tokens/s, remaining time: 0:24:07 +pred is: + ['Palladio'] + label is: + ['Andrea Palladio'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:09:59,672 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:09:59,673 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:09:59,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:09:59,673 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:09:59,673 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:00,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:00,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:01,209 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5355274677276611 s; generated tokens: 20 tokens; generate speed: 13.024840271725553 tokens/s +2024-07-30 14:10:01,214 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:01,214 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1009/2067], cost time 1.5471s, every example cost time is 1.5471, generate speed: 12.9273 tokens/s, avg speed: 10.3319 tokens/s, remaining time: 0:24:06 +pred is: + ['Bishopsgate'] + label is: + ['Bishopsgate'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:01,297 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:01,297 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 319, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:01,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:01,298 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:01,298 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:02,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:02,863 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5648117065429688 s; generated tokens: 20 tokens; generate speed: 12.781090476492299 tokens/s +2024-07-30 14:10:02,868 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:02,868 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1010/2067], cost time 1.5761s, every example cost time is 1.5761, generate speed: 12.6899 tokens/s, avg speed: 10.3346 tokens/s, remaining time: 0:24:05 +pred is: + ['19,000'] + label is: + ['over 19,000'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 62.69396298385885, Em score: 48.31683168316832, current_count: 1010 +2024-07-30 14:10:03,265 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:03,265 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 277, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:03,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:03,266 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:03,266 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:04,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,828 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5616650581359863 s; generated tokens: 20 tokens; generate speed: 12.806843500662128 tokens/s +2024-07-30 14:10:04,833 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:04,833 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1011/2067], cost time 1.5735s, every example cost time is 1.5735, generate speed: 12.7106 tokens/s, avg speed: 10.3373 tokens/s, remaining time: 0:24:04 +pred is: + ['6000'] + label is: + ['nearly 60,000'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:10:04,915 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:04,915 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:04,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:04,916 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:04,916 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:05,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:05,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:05,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:05,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:05,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,454 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5373964309692383 s; generated tokens: 20 tokens; generate speed: 13.009006393615193 tokens/s +2024-07-30 14:10:06,459 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:06,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1012/2067], cost time 1.5486s, every example cost time is 1.5486, generate speed: 12.9145 tokens/s, avg speed: 10.3402 tokens/s, remaining time: 0:24:03 +pred is: + ['70,000'] + label is: + ['more than 70,000'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:10:06,541 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:06,542 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:06,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:06,542 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:06,542 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:07,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1360220909118652 s; generated tokens: 7 tokens; generate speed: 6.161852006223947 tokens/s +2024-07-30 14:10:07,683 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:07,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1013/2067], cost time 1.1473s, every example cost time is 1.1473, generate speed: 6.1013 tokens/s, avg speed: 10.3366 tokens/s, remaining time: 0:24:01 +pred is: + ['Ando Cloisonné'] + label is: + ['Toshiba'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:10:07,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:07,766 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:07,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:07,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:07,766 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:08,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:08,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:09,118 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3513596057891846 s; generated tokens: 14 tokens; generate speed: 10.359936718564336 tokens/s +2024-07-30 14:10:09,123 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:09,123 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1014/2067], cost time 1.3625s, every example cost time is 1.3625, generate speed: 10.2753 tokens/s, avg speed: 10.3366 tokens/s, remaining time: 0:24:00 +pred is: + ['14th-15th century'] + label is: + ['from the 14th to the 19th century'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:10:09,206 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:09,207 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 276, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:09,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:09,231 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:09,231 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:10,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541295051574707 s; generated tokens: 20 tokens; generate speed: 12.976100831288884 tokens/s +2024-07-30 14:10:10,777 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:10,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1015/2067], cost time 1.5762s, every example cost time is 1.5762, generate speed: 12.6887 tokens/s, avg speed: 10.3392 tokens/s, remaining time: 0:23:59 +pred is: + ['Leonardo da Vinci'] + label is: + ['Leonardo da Vinci'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:10,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:10,860 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:10,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:10,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:10,861 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:11,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:11,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:11,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:11,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:11,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:11,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,141 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2800779342651367 s; generated tokens: 11 tokens; generate speed: 8.593226791550663 tokens/s +2024-07-30 14:10:12,146 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:12,146 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1016/2067], cost time 1.2912s, every example cost time is 1.2912, generate speed: 8.5193 tokens/s, avg speed: 10.3376 tokens/s, remaining time: 0:23:57 +pred is: + ['1'] + label is: + ['Charles Dickens'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:10:12,229 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:12,229 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:12,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:12,230 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:12,230 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:13,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,775 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.544572353363037 s; generated tokens: 20 tokens; generate speed: 12.948567903894878 tokens/s +2024-07-30 14:10:13,779 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:13,780 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1017/2067], cost time 1.5558s, every example cost time is 1.5558, generate speed: 12.8551 tokens/s, avg speed: 10.3404 tokens/s, remaining time: 0:23:56 +pred is: + ['Word and Image Department'] + label is: + ['Word and Image Department'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:13,862 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:13,863 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 352, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:13,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:13,863 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:13,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:14,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:14,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:14,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:14,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:14,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:14,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,128 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2638115882873535 s; generated tokens: 11 tokens; generate speed: 8.703829037448994 tokens/s +2024-07-30 14:10:15,132 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:15,133 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1018/2067], cost time 1.2753s, every example cost time is 1.2753, generate speed: 8.6257 tokens/s, avg speed: 10.3388 tokens/s, remaining time: 0:23:54 +pred is: + ['2007'] + label is: + ['2007'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:15,215 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:15,215 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:15,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:15,216 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:15,216 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:16,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,751 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5345642566680908 s; generated tokens: 20 tokens; generate speed: 13.033015667538631 tokens/s +2024-07-30 14:10:16,756 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:16,756 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1019/2067], cost time 1.5461s, every example cost time is 1.5461, generate speed: 12.9361 tokens/s, avg speed: 10.3417 tokens/s, remaining time: 0:23:53 +pred is: + ['Horace Walpole'] + label is: + ['British patrons'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:10:16,839 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:16,839 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:16,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:16,840 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:16,840 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:17,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:17,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:18,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:18,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:18,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:18,371 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531447410583496 s; generated tokens: 20 tokens; generate speed: 13.059540838153763 tokens/s +2024-07-30 14:10:18,376 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:18,377 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1020/2067], cost time 1.5429s, every example cost time is 1.5429, generate speed: 12.9630 tokens/s, avg speed: 10.3446 tokens/s, remaining time: 0:23:52 +pred is: + ['The increase in tea drinking'] + label is: + ['increase in tea drinking'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +F1 score: 62.575231320618414, Em score: 48.13725490196079, current_count: 1020 +2024-07-30 14:10:18,781 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:18,781 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:18,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:18,782 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:18,782 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:19,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:19,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:20,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:20,339 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5564699172973633 s; generated tokens: 20 tokens; generate speed: 12.849589817147107 tokens/s +2024-07-30 14:10:20,344 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:20,344 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1021/2067], cost time 1.5685s, every example cost time is 1.5685, generate speed: 12.7513 tokens/s, avg speed: 10.3473 tokens/s, remaining time: 0:23:51 +pred is: + ["Trajan's Column"] + label is: + ["Trajan's Column"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:20,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:20,428 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:20,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:20,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:20,428 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:21,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:21,933 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5042126178741455 s; generated tokens: 19 tokens; generate speed: 12.631193073524459 tokens/s +2024-07-30 14:10:21,938 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:21,938 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1022/2067], cost time 1.5156s, every example cost time is 1.5156, generate speed: 12.5365 tokens/s, avg speed: 10.3497 tokens/s, remaining time: 0:23:50 +pred is: + ['1731'] + label is: + ['1731'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:22,020 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:22,020 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:22,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:22,021 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:22,021 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:22,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:22,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,577 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5555555820465088 s; generated tokens: 20 tokens; generate speed: 12.857142638187023 tokens/s +2024-07-30 14:10:23,582 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:23,582 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1023/2067], cost time 1.5668s, every example cost time is 1.5668, generate speed: 12.7645 tokens/s, avg speed: 10.3524 tokens/s, remaining time: 0:23:49 +pred is: + ['Josiah Wedgwood, William De Morgan and Bernard Leach'] + label is: + ['Josiah Wedgwood, William De Morgan and Bernard Leach'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:23,665 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:23,666 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 311, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:23,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:23,666 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:23,667 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:24,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:24,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:24,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:24,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:24,710 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0433073043823242 s; generated tokens: 4 tokens; generate speed: 3.833961463893081 tokens/s +2024-07-30 14:10:24,715 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:24,715 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1024/2067], cost time 1.0544s, every example cost time is 1.0544, generate speed: 3.7935 tokens/s, avg speed: 10.3474 tokens/s, remaining time: 0:23:47 +pred is: + ['4000'] + label is: + ['4000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:24,797 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:24,797 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:24,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:24,798 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:24,798 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:25,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:25,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:26,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:26,332 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5335335731506348 s; generated tokens: 20 tokens; generate speed: 13.041775119999578 tokens/s +2024-07-30 14:10:26,337 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:26,337 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1025/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9465 tokens/s, avg speed: 10.3503 tokens/s, remaining time: 0:23:46 +pred is: + ['1994'] + label is: + ['1994'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:26,419 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:26,419 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:26,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:26,420 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:26,420 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:27,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:27,957 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5359861850738525 s; generated tokens: 20 tokens; generate speed: 13.020950444966646 tokens/s +2024-07-30 14:10:27,961 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:27,962 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1026/2067], cost time 1.5473s, every example cost time is 1.5473, generate speed: 12.9261 tokens/s, avg speed: 10.3531 tokens/s, remaining time: 0:23:44 +pred is: + ['10,000'] + label is: + ['over 10,000'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:10:28,044 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:28,044 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:28,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:28,045 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:28,045 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:28,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,116 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0708403587341309 s; generated tokens: 5 tokens; generate speed: 4.669230067038783 tokens/s +2024-07-30 14:10:29,121 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:29,121 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1027/2067], cost time 1.0819s, every example cost time is 1.0819, generate speed: 4.6214 tokens/s, avg speed: 10.3487 tokens/s, remaining time: 0:23:43 +pred is: + ['14,000'] + label is: + ['over 14,000'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:10:29,217 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:29,217 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:29,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:29,218 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:29,218 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:30,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,755 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5365064144134521 s; generated tokens: 20 tokens; generate speed: 13.016541820057956 tokens/s +2024-07-30 14:10:30,760 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:30,760 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1028/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9167 tokens/s, avg speed: 10.3515 tokens/s, remaining time: 0:23:42 +pred is: + ['2002'] + label is: + ['2002'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:30,843 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:30,843 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:30,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:30,844 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:30,844 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:31,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:31,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:32,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:32,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:32,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:32,390 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.545715570449829 s; generated tokens: 20 tokens; generate speed: 12.938991094059864 tokens/s +2024-07-30 14:10:32,395 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:32,395 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1029/2067], cost time 1.5577s, every example cost time is 1.5577, generate speed: 12.8394 tokens/s, avg speed: 10.3543 tokens/s, remaining time: 0:23:40 +pred is: + ['Renaissance'] + label is: + ['Italian and French Renaissance'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:10:32,479 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:32,479 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:32,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:32,480 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:32,480 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:33,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:33,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:34,022 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5423188209533691 s; generated tokens: 20 tokens; generate speed: 12.967487479428668 tokens/s +2024-07-30 14:10:34,027 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:34,028 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1030/2067], cost time 1.5540s, every example cost time is 1.5540, generate speed: 12.8702 tokens/s, avg speed: 10.3571 tokens/s, remaining time: 0:23:39 +pred is: + ['1580'] + label is: + ['1580'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.81721936604931, Em score: 48.349514563106794, current_count: 1030 +2024-07-30 14:10:34,407 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:34,407 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 338, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:34,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:34,408 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:34,408 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:35,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:35,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:35,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:35,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:35,454 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0455570220947266 s; generated tokens: 4 tokens; generate speed: 3.825711955897135 tokens/s +2024-07-30 14:10:35,459 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:35,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1031/2067], cost time 1.0576s, every example cost time is 1.0576, generate speed: 3.7823 tokens/s, avg speed: 10.3521 tokens/s, remaining time: 0:23:38 +pred is: + ['6000'] + label is: + ['over 6000'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:10:35,541 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:35,541 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 378, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:35,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:35,542 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:35,542 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:36,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,652 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1099133491516113 s; generated tokens: 6 tokens; generate speed: 5.405827404982779 tokens/s +2024-07-30 14:10:36,657 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:36,657 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1032/2067], cost time 1.1214s, every example cost time is 1.1214, generate speed: 5.3506 tokens/s, avg speed: 10.3482 tokens/s, remaining time: 0:23:36 +pred is: + ['secular and sacred'] + label is: + ['secular and sacred'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:36,740 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:36,740 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:36,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:36,741 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:36,741 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:37,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.075481653213501 s; generated tokens: 5 tokens; generate speed: 4.6490797728256705 tokens/s +2024-07-30 14:10:37,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:37,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1033/2067], cost time 1.0868s, every example cost time is 1.0868, generate speed: 4.6007 tokens/s, avg speed: 10.3437 tokens/s, remaining time: 0:23:34 +pred is: + ['c1110'] + label is: + ['c1110'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:37,904 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:37,904 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:37,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:37,905 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:37,905 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:38,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:38,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:38,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:38,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:38,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,104 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1985442638397217 s; generated tokens: 9 tokens; generate speed: 7.509109401739665 tokens/s +2024-07-30 14:10:39,108 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:39,109 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1034/2067], cost time 1.2099s, every example cost time is 1.2099, generate speed: 7.4385 tokens/s, avg speed: 10.3413 tokens/s, remaining time: 0:23:33 +pred is: + ['5100'] + label is: + ['over 5,100'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:10:39,193 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:39,193 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:39,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:39,193 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:39,194 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:40,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,734 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.540452241897583 s; generated tokens: 20 tokens; generate speed: 12.983200294066435 tokens/s +2024-07-30 14:10:40,739 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:40,740 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1035/2067], cost time 1.5519s, every example cost time is 1.5519, generate speed: 12.8878 tokens/s, avg speed: 10.3440 tokens/s, remaining time: 0:23:32 +pred is: + ['1130'] + label is: + ['1130'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:40,822 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:40,822 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 342, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:40,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:40,823 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:40,823 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:41,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:41,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:41,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:41,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:41,873 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0498311519622803 s; generated tokens: 4 tokens; generate speed: 3.810136508640884 tokens/s +2024-07-30 14:10:41,878 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:41,878 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1036/2067], cost time 1.0613s, every example cost time is 1.0613, generate speed: 3.7690 tokens/s, avg speed: 10.3391 tokens/s, remaining time: 0:23:30 +pred is: + ['1857'] + label is: + ['1857'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:41,960 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:41,961 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:41,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:41,961 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:41,962 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:42,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:42,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:42,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,103 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1416597366333008 s; generated tokens: 7 tokens; generate speed: 6.131424079684776 tokens/s +2024-07-30 14:10:43,108 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:43,109 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1037/2067], cost time 1.1530s, every example cost time is 1.1530, generate speed: 6.0710 tokens/s, avg speed: 10.3357 tokens/s, remaining time: 0:23:28 +pred is: + ['1600–1800'] + label is: + ['continental art 1600–1800'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:10:43,192 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:43,192 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:43,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:43,193 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:43,193 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:44,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,739 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5461993217468262 s; generated tokens: 20 tokens; generate speed: 12.93494293957192 tokens/s +2024-07-30 14:10:44,744 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:44,745 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1038/2067], cost time 1.5581s, every example cost time is 1.5581, generate speed: 12.8365 tokens/s, avg speed: 10.3384 tokens/s, remaining time: 0:23:27 +pred is: + ['Eadweard Muybridge'] + label is: + ['Eadweard Muybridge'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:44,835 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:44,836 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:44,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:44,837 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:44,837 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:45,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:45,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:46,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:46,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:46,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:46,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5509190559387207 s; generated tokens: 20 tokens; generate speed: 12.895579510366293 tokens/s +2024-07-30 14:10:46,393 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:46,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1039/2067], cost time 1.5628s, every example cost time is 1.5628, generate speed: 12.7971 tokens/s, avg speed: 10.3411 tokens/s, remaining time: 0:23:26 +pred is: + ['post-classical European'] + label is: + ['post-classical European'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:46,477 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:46,477 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 512, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:46,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:46,478 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:46,478 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:47,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:47,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:48,038 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5597314834594727 s; generated tokens: 20 tokens; generate speed: 12.822719943845815 tokens/s +2024-07-30 14:10:48,043 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:48,043 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1040/2067], cost time 1.5718s, every example cost time is 1.5718, generate speed: 12.7239 tokens/s, avg speed: 10.3437 tokens/s, remaining time: 0:23:25 +pred is: + ['National Galleries of Scotland'] + label is: + ['National Galleries of Scotland'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.992053795221906, Em score: 48.55769230769231, current_count: 1040 +2024-07-30 14:10:48,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:48,427 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:48,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:48,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:48,428 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:49,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,792 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3637864589691162 s; generated tokens: 14 tokens; generate speed: 10.265536739954564 tokens/s +2024-07-30 14:10:49,797 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:49,798 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1041/2067], cost time 1.3759s, every example cost time is 1.3759, generate speed: 10.1750 tokens/s, avg speed: 10.3436 tokens/s, remaining time: 0:23:23 +pred is: + ['20'] + label is: + ['more than 20'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:10:49,880 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:49,881 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:49,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:49,881 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:49,882 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:50,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:50,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:50,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:50,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:50,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:50,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,423 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5415992736816406 s; generated tokens: 20 tokens; generate speed: 12.973540103087936 tokens/s +2024-07-30 14:10:51,428 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:51,429 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1042/2067], cost time 1.5533s, every example cost time is 1.5533, generate speed: 12.8754 tokens/s, avg speed: 10.3463 tokens/s, remaining time: 0:23:22 +pred is: + ['4'] + label is: + ['George Frampton'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:10:51,512 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:51,512 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:51,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:51,513 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:51,513 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:52,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:52,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:53,058 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5449392795562744 s; generated tokens: 20 tokens; generate speed: 12.945492592915526 tokens/s +2024-07-30 14:10:53,064 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:53,064 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1043/2067], cost time 1.5573s, every example cost time is 1.5573, generate speed: 12.8425 tokens/s, avg speed: 10.3491 tokens/s, remaining time: 0:23:21 +pred is: + ['Dorothy and Michael Hintze'] + label is: + ['Dorothy and Michael Hintze'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:53,147 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:53,148 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:53,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:53,148 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:53,148 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:54,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,223 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0746374130249023 s; generated tokens: 5 tokens; generate speed: 4.652732111685875 tokens/s +2024-07-30 14:10:54,228 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:54,229 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1044/2067], cost time 1.0866s, every example cost time is 1.0866, generate speed: 4.6016 tokens/s, avg speed: 10.3447 tokens/s, remaining time: 0:23:19 +pred is: + ['53,000'] + label is: + ['more than 53,000'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:10:54,312 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:54,312 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:54,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:54,313 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:54,313 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:55,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,854 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5411248207092285 s; generated tokens: 20 tokens; generate speed: 12.977534156380639 tokens/s +2024-07-30 14:10:55,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:55,859 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1045/2067], cost time 1.5528s, every example cost time is 1.5528, generate speed: 12.8803 tokens/s, avg speed: 10.3474 tokens/s, remaining time: 0:23:18 +pred is: + ['The Cloth of St Gereon'] + label is: + ['Cloth of St Gereon'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:10:55,943 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:55,943 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:55,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:55,944 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:55,944 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:56,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:56,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:56,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:56,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:57,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:57,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:57,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:57,082 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1377780437469482 s; generated tokens: 7 tokens; generate speed: 6.152342311816365 tokens/s +2024-07-30 14:10:57,087 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:57,087 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1046/2067], cost time 1.1493s, every example cost time is 1.1493, generate speed: 6.0908 tokens/s, avg speed: 10.3440 tokens/s, remaining time: 0:23:17 +pred is: + ['Late 14th century'] + label is: + ['late 14th-century'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:10:57,171 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:57,171 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:57,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:57,172 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:57,172 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:58,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,730 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5574440956115723 s; generated tokens: 20 tokens; generate speed: 12.841552423200438 tokens/s +2024-07-30 14:10:58,735 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:10:58,735 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1047/2067], cost time 1.5692s, every example cost time is 1.5692, generate speed: 12.7456 tokens/s, avg speed: 10.3466 tokens/s, remaining time: 0:23:15 +pred is: + ['Theatre Museum'] + label is: + ['Theatre Museum'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:10:58,818 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:10:58,818 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:10:58,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:58,819 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:10:58,819 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:10:59,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:10:59,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:00,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:00,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:00,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5508110523223877 s; generated tokens: 20 tokens; generate speed: 12.896477601219942 tokens/s +2024-07-30 14:11:00,375 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:00,375 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1048/2067], cost time 1.5624s, every example cost time is 1.5624, generate speed: 12.8008 tokens/s, avg speed: 10.3493 tokens/s, remaining time: 0:23:14 +pred is: + ['preventive conservation'] + label is: + ['Conservation'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:11:00,469 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:00,469 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:00,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:00,470 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:00,470 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:01,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1050262451171875 s; generated tokens: 6 tokens; generate speed: 5.429735290462448 tokens/s +2024-07-30 14:11:01,580 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:01,581 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1049/2067], cost time 1.1169s, every example cost time is 1.1169, generate speed: 5.3721 tokens/s, avg speed: 10.3454 tokens/s, remaining time: 0:23:13 +pred is: + ['The Walt Disney Company'] + label is: + ['The Walt Disney Company'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:01,663 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:01,663 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:01,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:01,664 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:01,664 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:02,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:02,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:03,208 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5432765483856201 s; generated tokens: 20 tokens; generate speed: 12.959440108722873 tokens/s +2024-07-30 14:11:03,213 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:03,214 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1050/2067], cost time 1.5554s, every example cost time is 1.5554, generate speed: 12.8580 tokens/s, avg speed: 10.3482 tokens/s, remaining time: 0:23:11 +pred is: + ['1943'] + label is: + ['October 12, 1943'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +F1 score: 62.97251496089101, Em score: 48.38095238095238, current_count: 1050 +2024-07-30 14:11:03,600 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:03,601 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:03,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:03,602 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:03,602 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:04,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:04,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:05,136 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5341053009033203 s; generated tokens: 20 tokens; generate speed: 13.036914733443323 tokens/s +2024-07-30 14:11:05,141 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:05,141 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1051/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9362 tokens/s, avg speed: 10.3509 tokens/s, remaining time: 0:23:10 +pred is: + ['232'] + label is: + ['232'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:05,224 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:05,224 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:05,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:05,225 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:05,225 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:06,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,455 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.229839563369751 s; generated tokens: 10 tokens; generate speed: 8.131141896752839 tokens/s +2024-07-30 14:11:06,460 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:06,460 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1052/2067], cost time 1.2412s, every example cost time is 1.2412, generate speed: 8.0569 tokens/s, avg speed: 10.3490 tokens/s, remaining time: 0:23:09 +pred is: + ['Radio Corporation of America (RCA)'] + label is: + ['Radio Corporation of America'] +The F1/Em of this example is: {'F1': 77.77777777777779, 'Em': 0.0} +2024-07-30 14:11:06,543 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:06,543 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:06,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:06,544 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:06,544 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:07,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:07,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:08,080 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5358092784881592 s; generated tokens: 20 tokens; generate speed: 13.02245030039659 tokens/s +2024-07-30 14:11:08,085 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:08,085 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1053/2067], cost time 1.5474s, every example cost time is 1.5474, generate speed: 12.9249 tokens/s, avg speed: 10.3517 tokens/s, remaining time: 0:23:08 +pred is: + ['Mutual'] + label is: + ['Mutual'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:08,168 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:08,168 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 290, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:08,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:08,169 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:08,169 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:09,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,434 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2649168968200684 s; generated tokens: 11 tokens; generate speed: 8.696223465473025 tokens/s +2024-07-30 14:11:09,439 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:09,439 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1054/2067], cost time 1.2767s, every example cost time is 1.2767, generate speed: 8.6163 tokens/s, avg speed: 10.3502 tokens/s, remaining time: 0:23:06 +pred is: + ['Mark Woods'] + label is: + ['Mark Woods'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:09,522 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:09,522 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:09,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:09,523 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:09,523 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:10,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,597 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0740435123443604 s; generated tokens: 5 tokens; generate speed: 4.655304875950778 tokens/s +2024-07-30 14:11:10,602 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:10,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1055/2067], cost time 1.0856s, every example cost time is 1.0856, generate speed: 4.6056 tokens/s, avg speed: 10.3459 tokens/s, remaining time: 0:23:05 +pred is: + ['Life Savers'] + label is: + ['Life Savers candy'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:11:10,685 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:10,686 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:10,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:10,686 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:10,687 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:11,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:11,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:12,229 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5423781871795654 s; generated tokens: 20 tokens; generate speed: 12.966988360080832 tokens/s +2024-07-30 14:11:12,234 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:12,234 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1056/2067], cost time 1.5540s, every example cost time is 1.5540, generate speed: 12.8700 tokens/s, avg speed: 10.3486 tokens/s, remaining time: 0:23:03 +pred is: + ['1'] + label is: + ['Magnetophon tape recorder'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:11:12,317 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:12,318 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 273, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:12,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:12,318 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:12,319 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:13,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,550 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2310736179351807 s; generated tokens: 10 tokens; generate speed: 8.122991065938452 tokens/s +2024-07-30 14:11:13,555 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:13,555 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1057/2067], cost time 1.2423s, every example cost time is 1.2423, generate speed: 8.0497 tokens/s, avg speed: 10.3466 tokens/s, remaining time: 0:23:02 +pred is: + ['155'] + label is: + ['$155 million'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:11:13,639 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:13,639 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:13,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:13,640 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:13,640 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:14,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,903 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.262418270111084 s; generated tokens: 11 tokens; generate speed: 8.713435364835204 tokens/s +2024-07-30 14:11:14,908 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:14,908 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1058/2067], cost time 1.2737s, every example cost time is 1.2737, generate speed: 8.6360 tokens/s, avg speed: 10.3451 tokens/s, remaining time: 0:23:00 +pred is: + ['1959'] + label is: + ['1959'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:14,990 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:14,991 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 264, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:14,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:14,991 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:14,992 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:15,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:15,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,563 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5715582370758057 s; generated tokens: 20 tokens; generate speed: 12.72622262934013 tokens/s +2024-07-30 14:11:16,568 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:16,569 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1059/2067], cost time 1.5832s, every example cost time is 1.5832, generate speed: 12.6323 tokens/s, avg speed: 10.3476 tokens/s, remaining time: 0:22:59 +pred is: + ['The coronation of Queen Elizabeth II in June 1953'] + label is: + ['coronation of Queen Elizabeth II'] +The F1/Em of this example is: {'F1': 69.23076923076924, 'Em': 0.0} +2024-07-30 14:11:16,651 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:16,652 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:16,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:16,652 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:16,653 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:17,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:17,882 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2289886474609375 s; generated tokens: 10 tokens; generate speed: 8.136771662341854 tokens/s +2024-07-30 14:11:17,887 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:17,887 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1060/2067], cost time 1.2404s, every example cost time is 1.2404, generate speed: 8.0619 tokens/s, avg speed: 10.3457 tokens/s, remaining time: 0:22:58 +pred is: + ['A Charlie Brown Christmas'] + label is: + ['Peanuts'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.00297099617369, Em score: 48.301886792452834, current_count: 1060 +2024-07-30 14:11:18,274 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:18,274 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:18,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:18,275 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:18,275 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:19,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,826 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5501742362976074 s; generated tokens: 20 tokens; generate speed: 12.90177551122733 tokens/s +2024-07-30 14:11:19,831 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:19,831 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1061/2067], cost time 1.5623s, every example cost time is 1.5623, generate speed: 12.8018 tokens/s, avg speed: 10.3483 tokens/s, remaining time: 0:22:57 +pred is: + ['1974'] + label is: + ['1974'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:19,916 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:19,917 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 280, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:19,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:19,917 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:19,918 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:20,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:20,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:20,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:20,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:20,963 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0452029705047607 s; generated tokens: 4 tokens; generate speed: 3.8270078758657533 tokens/s +2024-07-30 14:11:20,968 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:20,968 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1062/2067], cost time 1.0574s, every example cost time is 1.0574, generate speed: 3.7829 tokens/s, avg speed: 10.3435 tokens/s, remaining time: 0:22:55 +pred is: + ['General Hospital'] + label is: + ['General Hospital'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:21,050 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:21,050 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 376, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:21,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:21,051 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:21,051 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:21,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,257 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2053911685943604 s; generated tokens: 9 tokens; generate speed: 7.466455897876825 tokens/s +2024-07-30 14:11:22,262 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:22,262 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1063/2067], cost time 1.2168s, every example cost time is 1.2168, generate speed: 7.3967 tokens/s, avg speed: 10.3411 tokens/s, remaining time: 0:22:53 +pred is: + ['X Games'] + label is: + ['X Games'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:22,350 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:22,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:22,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:22,351 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:22,351 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:23,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,801 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.450242280960083 s; generated tokens: 17 tokens; generate speed: 11.722179268381097 tokens/s +2024-07-30 14:11:23,806 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:23,806 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1064/2067], cost time 1.4617s, every example cost time is 1.4617, generate speed: 11.6303 tokens/s, avg speed: 10.3424 tokens/s, remaining time: 0:22:52 +pred is: + ['Frank Marx'] + label is: + ['Frank Marx'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:23,889 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:23,889 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:23,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:23,890 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:23,890 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:24,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:24,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:24,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:24,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:24,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:24,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,188 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2984387874603271 s; generated tokens: 12 tokens; generate speed: 9.241868092581647 tokens/s +2024-07-30 14:11:25,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:25,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1065/2067], cost time 1.3098s, every example cost time is 1.3098, generate speed: 9.1618 tokens/s, avg speed: 10.3413 tokens/s, remaining time: 0:22:51 +pred is: + ['108'] + label is: + ['108'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:25,276 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:25,276 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:25,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:25,277 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:25,277 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:26,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,672 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3945305347442627 s; generated tokens: 15 tokens; generate speed: 10.75630803792388 tokens/s +2024-07-30 14:11:26,677 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:26,677 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1066/2067], cost time 1.4059s, every example cost time is 1.4059, generate speed: 10.6693 tokens/s, avg speed: 10.3416 tokens/s, remaining time: 0:22:49 +pred is: + ['1'] + label is: + ['U.S. Supreme Court'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:11:26,759 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:26,760 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:26,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:26,760 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:26,761 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:27,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:27,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:28,309 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5478155612945557 s; generated tokens: 20 tokens; generate speed: 12.921436184084156 tokens/s +2024-07-30 14:11:28,314 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:28,314 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1067/2067], cost time 1.5596s, every example cost time is 1.5596, generate speed: 12.8238 tokens/s, avg speed: 10.3443 tokens/s, remaining time: 0:22:48 +pred is: + ['Leonard Goldenson'] + label is: + ['Leonard Goldenson'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:28,397 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:28,397 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:28,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:28,398 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:28,398 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:29,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2687342166900635 s; generated tokens: 11 tokens; generate speed: 8.670058594854755 tokens/s +2024-07-30 14:11:29,671 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:29,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1068/2067], cost time 1.2803s, every example cost time is 1.2803, generate speed: 8.5919 tokens/s, avg speed: 10.3427 tokens/s, remaining time: 0:22:47 +pred is: + ['1952'] + label is: + ['1952'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:29,754 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:29,754 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 332, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:29,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:29,755 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:29,755 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:30,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:30,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:31,303 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5483951568603516 s; generated tokens: 20 tokens; generate speed: 12.916599429665991 tokens/s +2024-07-30 14:11:31,308 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:31,309 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1069/2067], cost time 1.5597s, every example cost time is 1.5597, generate speed: 12.8228 tokens/s, avg speed: 10.3454 tokens/s, remaining time: 0:22:45 +pred is: + ['August 10, 1948'] + label is: + ['August 10, 1948'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:31,391 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:31,392 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:31,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:31,392 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:31,393 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:32,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:32,653 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2606768608093262 s; generated tokens: 11 tokens; generate speed: 8.725471484372488 tokens/s +2024-07-30 14:11:32,658 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:32,658 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1070/2067], cost time 1.2720s, every example cost time is 1.2720, generate speed: 8.6475 tokens/s, avg speed: 10.3439 tokens/s, remaining time: 0:22:44 +pred is: + ['1960'] + label is: + ['September 30, 1960'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +F1 score: 63.188524004220135, Em score: 48.598130841121495, current_count: 1070 +2024-07-30 14:11:33,048 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:33,049 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:33,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:33,049 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:33,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:33,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,256 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2060484886169434 s; generated tokens: 9 tokens; generate speed: 7.4623865333315935 tokens/s +2024-07-30 14:11:34,261 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:34,261 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1071/2067], cost time 1.2177s, every example cost time is 1.2177, generate speed: 7.3910 tokens/s, avg speed: 10.3414 tokens/s, remaining time: 0:22:43 +pred is: + ['1959'] + label is: + ['1959'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:34,344 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:34,344 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:34,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:34,345 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:34,345 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:35,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3977386951446533 s; generated tokens: 15 tokens; generate speed: 10.731619616818032 tokens/s +2024-07-30 14:11:35,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:35,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1072/2067], cost time 1.4092s, every example cost time is 1.4092, generate speed: 10.6443 tokens/s, avg speed: 10.3417 tokens/s, remaining time: 0:22:41 +pred is: + ['The dot'] + label is: + ['circle logo'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:11:35,831 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:35,831 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 319, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:35,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:35,832 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:35,832 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:36,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:36,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:37,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:37,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:37,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:37,320 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4876866340637207 s; generated tokens: 18 tokens; generate speed: 12.099322255004559 tokens/s +2024-07-30 14:11:37,325 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:37,325 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1073/2067], cost time 1.4991s, every example cost time is 1.4991, generate speed: 12.0069 tokens/s, avg speed: 10.3434 tokens/s, remaining time: 0:22:40 +pred is: + ['Pittard Sullivan'] + label is: + ['Pittard Sullivan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:37,433 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:37,433 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:37,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:37,434 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:37,434 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:38,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,760 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3254806995391846 s; generated tokens: 13 tokens; generate speed: 9.807762575886294 tokens/s +2024-07-30 14:11:38,765 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:38,765 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1074/2067], cost time 1.3371s, every example cost time is 1.3371, generate speed: 9.7226 tokens/s, avg speed: 10.3429 tokens/s, remaining time: 0:22:39 +pred is: + ['1995-96'] + label is: + ['1993–94 season'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:11:38,848 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:38,848 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:38,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:38,849 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:38,849 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:39,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:39,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:40,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:40,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:40,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:40,411 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.561753273010254 s; generated tokens: 20 tokens; generate speed: 12.806120112333959 tokens/s +2024-07-30 14:11:40,416 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:40,416 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1075/2067], cost time 1.5731s, every example cost time is 1.5731, generate speed: 12.7140 tokens/s, avg speed: 10.3454 tokens/s, remaining time: 0:22:37 +pred is: + ['1977'] + label is: + ['1977'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:40,498 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:40,498 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:40,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:40,499 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:40,499 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:41,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:41,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:41,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:41,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:41,543 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0437920093536377 s; generated tokens: 4 tokens; generate speed: 3.832181089867681 tokens/s +2024-07-30 14:11:41,548 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:41,548 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1076/2067], cost time 1.0551s, every example cost time is 1.0551, generate speed: 3.7912 tokens/s, avg speed: 10.3407 tokens/s, remaining time: 0:22:36 +pred is: + ['Paul Rand'] + label is: + ['Paul Rand'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:41,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:41,655 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:41,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:41,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:41,656 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:42,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,886 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2304091453552246 s; generated tokens: 10 tokens; generate speed: 8.127377822043867 tokens/s +2024-07-30 14:11:42,891 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:42,891 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1077/2067], cost time 1.2420s, every example cost time is 1.2420, generate speed: 8.0518 tokens/s, avg speed: 10.3388 tokens/s, remaining time: 0:22:34 +pred is: + ['ABC Radio'] + label is: + ['ABC Radio'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:42,973 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:42,974 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:42,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:42,974 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:42,975 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:43,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:43,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:43,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,179 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2039098739624023 s; generated tokens: 9 tokens; generate speed: 7.475642649543604 tokens/s +2024-07-30 14:11:44,183 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:44,184 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1078/2067], cost time 1.2151s, every example cost time is 1.2151, generate speed: 7.4065 tokens/s, avg speed: 10.3364 tokens/s, remaining time: 0:22:33 +pred is: + ['2004'] + label is: + ['2004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:44,266 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:44,266 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:44,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:44,267 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:44,267 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:45,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,527 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2598819732666016 s; generated tokens: 11 tokens; generate speed: 8.730976578289614 tokens/s +2024-07-30 14:11:45,532 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:45,532 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1079/2067], cost time 1.2714s, every example cost time is 1.2714, generate speed: 8.6516 tokens/s, avg speed: 10.3349 tokens/s, remaining time: 0:22:31 +pred is: + ['2002'] + label is: + ['2002'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:45,639 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:45,640 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:45,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:45,641 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:45,641 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:46,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:46,874 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2330257892608643 s; generated tokens: 10 tokens; generate speed: 8.11013045071384 tokens/s +2024-07-30 14:11:46,879 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:46,879 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1080/2067], cost time 1.2446s, every example cost time is 1.2446, generate speed: 8.0349 tokens/s, avg speed: 10.3330 tokens/s, remaining time: 0:22:30 +pred is: + ['Time Warner Cable'] + label is: + ['Time Warner Cable'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.37505001652675, Em score: 48.888888888888886, current_count: 1080 +2024-07-30 14:11:47,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:47,271 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:47,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:47,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:47,272 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:48,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2615554332733154 s; generated tokens: 11 tokens; generate speed: 8.719394891319734 tokens/s +2024-07-30 14:11:48,539 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:48,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1081/2067], cost time 1.2731s, every example cost time is 1.2731, generate speed: 8.6405 tokens/s, avg speed: 10.3315 tokens/s, remaining time: 0:22:28 +pred is: + ['2000'] + label is: + ['2000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:48,620 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:48,621 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:48,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:48,621 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:48,621 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:49,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,838 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2167675495147705 s; generated tokens: 9 tokens; generate speed: 7.396646963168167 tokens/s +2024-07-30 14:11:49,843 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:49,844 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1082/2067], cost time 1.2279s, every example cost time is 1.2279, generate speed: 7.3293 tokens/s, avg speed: 10.3290 tokens/s, remaining time: 0:22:27 +pred is: + ['1999'] + label is: + ['August 1999'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:11:49,926 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:49,927 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 377, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:49,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:49,928 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:49,928 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:50,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:50,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:50,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:50,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,348 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4202616214752197 s; generated tokens: 16 tokens; generate speed: 11.265530067186402 tokens/s +2024-07-30 14:11:51,353 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:51,353 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1083/2067], cost time 1.4319s, every example cost time is 1.4319, generate speed: 11.1740 tokens/s, avg speed: 10.3298 tokens/s, remaining time: 0:22:26 +pred is: + ['July 31, 1995'] + label is: + ['July 31, 1995'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:51,436 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:51,436 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:51,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:51,437 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:51,437 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:52,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:52,996 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.55855393409729 s; generated tokens: 20 tokens; generate speed: 12.832408017746234 tokens/s +2024-07-30 14:11:53,001 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:53,001 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1084/2067], cost time 1.5702s, every example cost time is 1.5702, generate speed: 12.7376 tokens/s, avg speed: 10.3324 tokens/s, remaining time: 0:22:24 +pred is: + ['1965-66'] + label is: + ['1965–66 season'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:11:53,083 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:53,083 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:53,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:53,084 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:53,084 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:54,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,643 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5582623481750488 s; generated tokens: 20 tokens; generate speed: 12.83480924981785 tokens/s +2024-07-30 14:11:54,647 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:54,648 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1085/2067], cost time 1.5695s, every example cost time is 1.5695, generate speed: 12.7431 tokens/s, avg speed: 10.3349 tokens/s, remaining time: 0:22:23 +pred is: + ['May 1, 1953'] + label is: + ['May 1, 1953'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:54,731 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:54,731 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 296, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:54,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:54,732 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:54,732 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:55,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:55,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:56,023 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2909793853759766 s; generated tokens: 12 tokens; generate speed: 9.295268488354054 tokens/s +2024-07-30 14:11:56,028 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:56,028 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1086/2067], cost time 1.3022s, every example cost time is 1.3022, generate speed: 9.2148 tokens/s, avg speed: 10.3340 tokens/s, remaining time: 0:22:22 +pred is: + ['Robert Kintner'] + label is: + ['Robert Kintner'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:56,110 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:56,111 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:56,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:56,111 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:56,112 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:57,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,662 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5501506328582764 s; generated tokens: 20 tokens; generate speed: 12.901971960700747 tokens/s +2024-07-30 14:11:57,667 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:57,667 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1087/2067], cost time 1.5615s, every example cost time is 1.5615, generate speed: 12.8084 tokens/s, avg speed: 10.3366 tokens/s, remaining time: 0:22:21 +pred is: + ['Paramount Pictures'] + label is: + ['Paramount Pictures'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:57,749 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:57,750 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:57,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:57,750 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:57,751 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:11:58,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:58,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:59,015 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2639529705047607 s; generated tokens: 11 tokens; generate speed: 8.702855451660627 tokens/s +2024-07-30 14:11:59,020 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:11:59,020 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1088/2067], cost time 1.2752s, every example cost time is 1.2752, generate speed: 8.6259 tokens/s, avg speed: 10.3351 tokens/s, remaining time: 0:22:19 +pred is: + ['Cheyenne'] + label is: + ['Cheyenne'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:11:59,127 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:11:59,127 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:11:59,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:11:59,128 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:11:59,128 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:00,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:00,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:00,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:00,140 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011864423751831 s; generated tokens: 3 tokens; generate speed: 2.9648240708735276 tokens/s +2024-07-30 14:12:00,145 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:00,145 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1089/2067], cost time 1.0236s, every example cost time is 1.0236, generate speed: 2.9309 tokens/s, avg speed: 10.3300 tokens/s, remaining time: 0:22:17 +pred is: + ['Roy'] + label is: + ['Roy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:00,228 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:00,228 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:00,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:00,229 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:00,229 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:01,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:01,788 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.558927297592163 s; generated tokens: 20 tokens; generate speed: 12.829334652674916 tokens/s +2024-07-30 14:12:01,793 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:01,793 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1090/2067], cost time 1.5705s, every example cost time is 1.5705, generate speed: 12.7350 tokens/s, avg speed: 10.3325 tokens/s, remaining time: 0:22:16 +pred is: + ['Allen Shaw'] + label is: + ['Allen Shaw'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.57344405307237, Em score: 49.174311926605505, current_count: 1090 +2024-07-30 14:12:02,185 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:02,185 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:02,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:02,186 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:02,186 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:03,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,386 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2001869678497314 s; generated tokens: 9 tokens; generate speed: 7.498831632978403 tokens/s +2024-07-30 14:12:03,391 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:03,391 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1091/2067], cost time 1.2116s, every example cost time is 1.2116, generate speed: 7.4283 tokens/s, avg speed: 10.3302 tokens/s, remaining time: 0:22:15 +pred is: + ['1969'] + label is: + ['1969'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:03,474 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:03,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:03,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:03,475 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:03,475 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:04,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:04,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:05,006 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5305709838867188 s; generated tokens: 20 tokens; generate speed: 13.067018916830746 tokens/s +2024-07-30 14:12:05,011 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:05,011 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1092/2067], cost time 1.5419s, every example cost time is 1.5419, generate speed: 12.9707 tokens/s, avg speed: 10.3329 tokens/s, remaining time: 0:22:13 +pred is: + ['1970s'] + label is: + ['early 1970s'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:12:05,093 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:05,094 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:05,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:05,094 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:05,095 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:06,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,355 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.259972333908081 s; generated tokens: 11 tokens; generate speed: 8.730350424347083 tokens/s +2024-07-30 14:12:06,360 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:06,360 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1093/2067], cost time 1.2714s, every example cost time is 1.2714, generate speed: 8.6520 tokens/s, avg speed: 10.3315 tokens/s, remaining time: 0:22:12 +pred is: + ['Monday Night Football'] + label is: + ['Monday Night Football'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:06,442 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:06,442 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:06,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:06,443 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:06,443 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:07,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,702 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2585651874542236 s; generated tokens: 11 tokens; generate speed: 8.740111445677574 tokens/s +2024-07-30 14:12:07,707 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:07,707 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1094/2067], cost time 1.2699s, every example cost time is 1.2699, generate speed: 8.6624 tokens/s, avg speed: 10.3301 tokens/s, remaining time: 0:22:11 +pred is: + ['1970'] + label is: + ['1970'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:07,789 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:07,789 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:07,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:07,790 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:07,790 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:08,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:08,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:09,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:09,051 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2610585689544678 s; generated tokens: 11 tokens; generate speed: 8.722830382985304 tokens/s +2024-07-30 14:12:09,056 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:09,056 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1095/2067], cost time 1.2722s, every example cost time is 1.2722, generate speed: 8.6463 tokens/s, avg speed: 10.3286 tokens/s, remaining time: 0:22:09 +pred is: + ['Cigarette advertising on television and radio networks'] + label is: + ['cigarette advertising from all television and radio networks'] +The F1/Em of this example is: {'F1': 57.14285714285715, 'Em': 0.0} +2024-07-30 14:12:09,139 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:09,140 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:09,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:09,140 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:09,141 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:10,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,678 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372779369354248 s; generated tokens: 20 tokens; generate speed: 13.010009133332227 tokens/s +2024-07-30 14:12:10,683 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:10,683 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1096/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9159 tokens/s, avg speed: 10.3313 tokens/s, remaining time: 0:22:08 +pred is: + ['1966'] + label is: + ['1966'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:10,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:10,765 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 333, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:10,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:10,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:10,766 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:11,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:11,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:12,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:12,320 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5535500049591064 s; generated tokens: 20 tokens; generate speed: 12.87374074613482 tokens/s +2024-07-30 14:12:12,324 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:12,325 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1097/2067], cost time 1.5647s, every example cost time is 1.5647, generate speed: 12.7823 tokens/s, avg speed: 10.3339 tokens/s, remaining time: 0:22:07 +pred is: + ['Fred Pierce'] + label is: + ['Fred Pierce'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:12,407 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:12,408 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:12,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:12,408 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:12,408 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:13,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:13,959 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5507705211639404 s; generated tokens: 20 tokens; generate speed: 12.896814665388968 tokens/s +2024-07-30 14:12:13,966 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:13,966 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1098/2067], cost time 1.5634s, every example cost time is 1.5634, generate speed: 12.7922 tokens/s, avg speed: 10.3364 tokens/s, remaining time: 0:22:06 +pred is: + ['2'] + label is: + ["president of NBC's entertainment division"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:12:14,049 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:14,049 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:14,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:14,050 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:14,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:14,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,225 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1745095252990723 s; generated tokens: 8 tokens; generate speed: 6.81135386957625 tokens/s +2024-07-30 14:12:15,230 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:15,230 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1099/2067], cost time 1.1856s, every example cost time is 1.1856, generate speed: 6.7476 tokens/s, avg speed: 10.3336 tokens/s, remaining time: 0:22:04 +pred is: + ['Alex Haley'] + label is: + ['Alex Haley'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:15,312 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:15,312 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:15,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:15,313 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:15,313 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:16,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,548 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2343122959136963 s; generated tokens: 10 tokens; generate speed: 8.101677373794228 tokens/s +2024-07-30 14:12:16,553 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:16,553 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1100/2067], cost time 1.2458s, every example cost time is 1.2458, generate speed: 8.0270 tokens/s, avg speed: 10.3317 tokens/s, remaining time: 0:22:03 +pred is: + ['Roone Arledge'] + label is: + ['Roone Arledge'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.72926988635613, Em score: 49.36363636363637, current_count: 1100 +2024-07-30 14:12:16,946 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:16,947 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:16,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:16,948 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:16,948 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:17,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:17,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:17,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:17,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:17,995 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0472743511199951 s; generated tokens: 4 tokens; generate speed: 3.8194385222193663 tokens/s +2024-07-30 14:12:18,000 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:18,000 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1101/2067], cost time 1.0590s, every example cost time is 1.0590, generate speed: 3.7773 tokens/s, avg speed: 10.3271 tokens/s, remaining time: 0:22:01 +pred is: + ['1978'] + label is: + ['June 1978'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:12:18,082 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:18,082 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:18,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:18,083 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:18,083 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:19,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,637 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5539638996124268 s; generated tokens: 20 tokens; generate speed: 12.870311855370764 tokens/s +2024-07-30 14:12:19,642 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:19,643 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1102/2067], cost time 1.5655s, every example cost time is 1.5655, generate speed: 12.7755 tokens/s, avg speed: 10.3296 tokens/s, remaining time: 0:22:00 +pred is: + ['24'] + label is: + ['ABC Cable News'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:12:19,732 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:19,733 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 305, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:19,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:19,734 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:19,734 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:20,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:20,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:21,276 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.542344093322754 s; generated tokens: 20 tokens; generate speed: 12.967274998222308 tokens/s +2024-07-30 14:12:21,281 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:21,282 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1103/2067], cost time 1.5563s, every example cost time is 1.5563, generate speed: 12.8507 tokens/s, avg speed: 10.3322 tokens/s, remaining time: 0:21:58 +pred is: + ['1'] + label is: + ['Writers Guild of America'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:12:21,371 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:21,372 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:21,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:21,373 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:21,373 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:22,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,538 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1651787757873535 s; generated tokens: 8 tokens; generate speed: 6.865899178942828 tokens/s +2024-07-30 14:12:22,543 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:22,543 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1104/2067], cost time 1.1768s, every example cost time is 1.1768, generate speed: 6.7978 tokens/s, avg speed: 10.3295 tokens/s, remaining time: 0:21:57 +pred is: + ['ABC Entertainment'] + label is: + ['ABC Entertainment'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:22,627 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:22,627 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:22,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:22,628 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:22,628 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:23,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,705 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0772545337677002 s; generated tokens: 5 tokens; generate speed: 4.641428597670867 tokens/s +2024-07-30 14:12:23,710 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:23,710 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1105/2067], cost time 1.0885s, every example cost time is 1.0885, generate speed: 4.5933 tokens/s, avg speed: 10.3253 tokens/s, remaining time: 0:21:55 +pred is: + ['2010'] + label is: + ['2010'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:23,802 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:23,803 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:23,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:23,803 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:23,804 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:24,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:24,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:25,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:25,063 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2590548992156982 s; generated tokens: 11 tokens; generate speed: 8.736711962959056 tokens/s +2024-07-30 14:12:25,068 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:25,068 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1106/2067], cost time 1.2708s, every example cost time is 1.2708, generate speed: 8.6559 tokens/s, avg speed: 10.3239 tokens/s, remaining time: 0:21:54 +pred is: + ['1970'] + label is: + ['1970'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:25,150 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:25,151 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:25,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:25,151 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:25,152 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:26,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,472 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3202464580535889 s; generated tokens: 13 tokens; generate speed: 9.8466463747728 tokens/s +2024-07-30 14:12:26,477 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:26,477 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1107/2067], cost time 1.3316s, every example cost time is 1.3316, generate speed: 9.7630 tokens/s, avg speed: 10.3234 tokens/s, remaining time: 0:21:52 +pred is: + ['Disney–ABC Domestic Television'] + label is: + ['Disney–ABC Domestic Television'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:26,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:26,560 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:26,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:26,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:26,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:27,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:27,941 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.379516363143921 s; generated tokens: 15 tokens; generate speed: 10.873375916915524 tokens/s +2024-07-30 14:12:27,946 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:27,946 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1108/2067], cost time 1.3907s, every example cost time is 1.3907, generate speed: 10.7857 tokens/s, avg speed: 10.3239 tokens/s, remaining time: 0:21:51 +pred is: + ['WABC-TV and WPVI-TV'] + label is: + ['WABC-TV and WPVI-TV'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:28,028 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:28,029 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:28,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:28,030 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:28,030 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:28,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:29,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:29,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:29,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:29,072 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0421626567840576 s; generated tokens: 4 tokens; generate speed: 3.838172452219063 tokens/s +2024-07-30 14:12:29,077 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:29,077 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1109/2067], cost time 1.0540s, every example cost time is 1.0540, generate speed: 3.7952 tokens/s, avg speed: 10.3193 tokens/s, remaining time: 0:21:49 +pred is: + ['1946'] + label is: + ['1946'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:29,160 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:29,160 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:29,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:29,161 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:29,161 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:30,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:30,701 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5400276184082031 s; generated tokens: 20 tokens; generate speed: 12.986780081692507 tokens/s +2024-07-30 14:12:30,706 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:30,706 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1110/2067], cost time 1.5513s, every example cost time is 1.5513, generate speed: 12.8923 tokens/s, avg speed: 10.3219 tokens/s, remaining time: 0:21:48 +pred is: + ['2011'] + label is: + ['2011'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.83080799548806, Em score: 49.549549549549546, current_count: 1110 +2024-07-30 14:12:31,103 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:31,104 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:31,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:31,104 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:31,105 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:32,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,644 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390567779541016 s; generated tokens: 20 tokens; generate speed: 12.994972171583164 tokens/s +2024-07-30 14:12:32,649 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:32,649 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1111/2067], cost time 1.5508s, every example cost time is 1.5508, generate speed: 12.8966 tokens/s, avg speed: 10.3246 tokens/s, remaining time: 0:21:47 +pred is: + ['720p'] + label is: + ['720p high definition'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:12:32,731 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:32,731 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:32,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:32,732 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:32,732 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:33,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,804 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0712180137634277 s; generated tokens: 5 tokens; generate speed: 4.667583942538349 tokens/s +2024-07-30 14:12:33,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:33,809 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1112/2067], cost time 1.0823s, every example cost time is 1.0823, generate speed: 4.6197 tokens/s, avg speed: 10.3205 tokens/s, remaining time: 0:21:45 +pred is: + ['Body of Proof'] + label is: + ['Body of Proof'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:33,891 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:33,891 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:33,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:33,892 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:33,892 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:34,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:34,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:34,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:34,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:34,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:34,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,301 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4085114002227783 s; generated tokens: 16 tokens; generate speed: 11.359510471458979 tokens/s +2024-07-30 14:12:35,305 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:35,306 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1113/2067], cost time 1.4197s, every example cost time is 1.4197, generate speed: 11.2704 tokens/s, avg speed: 10.3214 tokens/s, remaining time: 0:21:44 +pred is: + ['All My Children and One Life to Live'] + label is: + ['All My Children and One Life to Live'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:35,396 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:35,397 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:35,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:35,397 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:35,397 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:36,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,655 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.257005214691162 s; generated tokens: 11 tokens; generate speed: 8.750958127649954 tokens/s +2024-07-30 14:12:36,660 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:36,660 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1114/2067], cost time 1.2687s, every example cost time is 1.2687, generate speed: 8.6705 tokens/s, avg speed: 10.3200 tokens/s, remaining time: 0:21:43 +pred is: + ['2004'] + label is: + ['2004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:36,742 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:36,743 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:36,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:36,743 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:36,744 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:37,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:37,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:38,032 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2885746955871582 s; generated tokens: 12 tokens; generate speed: 9.312614969931582 tokens/s +2024-07-30 14:12:38,037 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:38,038 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1115/2067], cost time 1.2998s, every example cost time is 1.2998, generate speed: 9.2319 tokens/s, avg speed: 10.3191 tokens/s, remaining time: 0:21:41 +pred is: + ['The Middle and Modern Family'] + label is: + ['The Middle and Modern Family'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:38,121 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:38,121 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:38,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:38,122 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:38,122 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:39,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,316 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.193683385848999 s; generated tokens: 9 tokens; generate speed: 7.53968774860581 tokens/s +2024-07-30 14:12:39,320 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:39,321 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1116/2067], cost time 1.2050s, every example cost time is 1.2050, generate speed: 7.4687 tokens/s, avg speed: 10.3168 tokens/s, remaining time: 0:21:40 +pred is: + ['Thomas Murphy'] + label is: + ['Daniel Burke'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:12:39,405 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:39,406 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:39,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:39,407 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:39,407 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:40,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:40,951 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5440945625305176 s; generated tokens: 20 tokens; generate speed: 12.952574593115127 tokens/s +2024-07-30 14:12:40,957 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:40,957 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1117/2067], cost time 1.5567s, every example cost time is 1.5567, generate speed: 12.8480 tokens/s, avg speed: 10.3194 tokens/s, remaining time: 0:21:39 +pred is: + ['1993'] + label is: + ['1993'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:41,041 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:41,042 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:41,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:41,043 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:41,043 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:41,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,271 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.227614402770996 s; generated tokens: 10 tokens; generate speed: 8.14588031667582 tokens/s +2024-07-30 14:12:42,275 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:42,276 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1118/2067], cost time 1.2399s, every example cost time is 1.2399, generate speed: 8.0655 tokens/s, avg speed: 10.3176 tokens/s, remaining time: 0:21:37 +pred is: + ['WLS'] + label is: + ['WLS'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:42,358 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:42,358 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:42,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:42,358 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:42,359 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:43,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,586 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2266838550567627 s; generated tokens: 10 tokens; generate speed: 8.15205968414516 tokens/s +2024-07-30 14:12:43,591 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:43,591 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1119/2067], cost time 1.2383s, every example cost time is 1.2383, generate speed: 8.0756 tokens/s, avg speed: 10.3158 tokens/s, remaining time: 0:21:36 +pred is: + ['Wide World of Sports'] + label is: + ['Wide World of Sports'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:43,674 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:43,674 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 287, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:43,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:43,675 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:43,675 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:44,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:44,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:45,219 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5433320999145508 s; generated tokens: 20 tokens; generate speed: 12.958973639638113 tokens/s +2024-07-30 14:12:45,224 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:45,224 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1120/2067], cost time 1.5549s, every example cost time is 1.5549, generate speed: 12.8622 tokens/s, avg speed: 10.3184 tokens/s, remaining time: 0:21:34 +pred is: + ['American Broadcasting Companies'] + label is: + ['American Broadcasting Companies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.03469959076644, Em score: 49.82142857142857, current_count: 1120 +2024-07-30 14:12:45,626 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:45,626 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 273, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:45,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:45,627 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:45,627 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:46,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,857 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2298071384429932 s; generated tokens: 10 tokens; generate speed: 8.131356281327637 tokens/s +2024-07-30 14:12:46,862 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:46,862 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1121/2067], cost time 1.2415s, every example cost time is 1.2415, generate speed: 8.0548 tokens/s, avg speed: 10.3165 tokens/s, remaining time: 0:21:33 +pred is: + ['90'] + label is: + ['90%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:12:46,946 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:46,946 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:46,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:46,947 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:46,947 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:47,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:47,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:47,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:47,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,272 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3254404067993164 s; generated tokens: 13 tokens; generate speed: 9.808060727069956 tokens/s +2024-07-30 14:12:48,277 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:48,277 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1122/2067], cost time 1.3368s, every example cost time is 1.3368, generate speed: 9.7245 tokens/s, avg speed: 10.3160 tokens/s, remaining time: 0:21:32 +pred is: + ['Infinity Broadcasting Corporation'] + label is: + ['Infinity Broadcasting Corporation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:48,360 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:48,361 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 306, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:48,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:48,361 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:48,361 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:49,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,471 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1094341278076172 s; generated tokens: 6 tokens; generate speed: 5.408162458330683 tokens/s +2024-07-30 14:12:49,476 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:49,476 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1123/2067], cost time 1.1206s, every example cost time is 1.1206, generate speed: 5.3543 tokens/s, avg speed: 10.3124 tokens/s, remaining time: 0:21:30 +pred is: + ['Daniel B. Burke'] + label is: + ['Daniel B. Burke'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:49,559 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:49,559 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:49,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:49,560 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:49,560 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:50,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:50,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:50,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:50,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:50,604 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.044130563735962 s; generated tokens: 4 tokens; generate speed: 3.8309385233277338 tokens/s +2024-07-30 14:12:50,609 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:50,609 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1124/2067], cost time 1.0559s, every example cost time is 1.0559, generate speed: 3.7884 tokens/s, avg speed: 10.3079 tokens/s, remaining time: 0:21:28 +pred is: + ['General Hospital'] + label is: + ['General Hospital'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:50,694 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:50,694 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:50,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:50,695 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:50,695 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:51,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:51,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:52,242 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5468511581420898 s; generated tokens: 20 tokens; generate speed: 12.929492210499319 tokens/s +2024-07-30 14:12:52,247 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:52,248 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1125/2067], cost time 1.5589s, every example cost time is 1.5589, generate speed: 12.8294 tokens/s, avg speed: 10.3105 tokens/s, remaining time: 0:21:27 +pred is: + ['New Jersey, Rhode Island and Delaware'] + label is: + ['New Jersey, Rhode Island and Delaware'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:52,330 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:52,330 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:52,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:52,331 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:52,331 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:53,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,561 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2302477359771729 s; generated tokens: 10 tokens; generate speed: 8.12844413979523 tokens/s +2024-07-30 14:12:53,566 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:53,567 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1126/2067], cost time 1.2414s, every example cost time is 1.2414, generate speed: 8.0551 tokens/s, avg speed: 10.3086 tokens/s, remaining time: 0:21:26 +pred is: + ['ABC Circle Films'] + label is: + ['ABC Circle Films'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:53,649 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:53,650 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:53,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:53,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:53,650 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:54,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,850 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1989281177520752 s; generated tokens: 9 tokens; generate speed: 7.506705253417953 tokens/s +2024-07-30 14:12:54,854 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:54,855 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1127/2067], cost time 1.2101s, every example cost time is 1.2101, generate speed: 7.4374 tokens/s, avg speed: 10.3064 tokens/s, remaining time: 0:21:24 +pred is: + ['Times Square Studios'] + label is: + ['Times Square Studios'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:54,938 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:54,938 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:54,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:54,938 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:54,939 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:55,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:55,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:55,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:55,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,489 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5502991676330566 s; generated tokens: 20 tokens; generate speed: 12.900735817677894 tokens/s +2024-07-30 14:12:56,494 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:56,494 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1128/2067], cost time 1.5616s, every example cost time is 1.5616, generate speed: 12.8070 tokens/s, avg speed: 10.3089 tokens/s, remaining time: 0:21:23 +pred is: + ['ABC on Demand'] + label is: + ['ABC on Demand'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:12:56,577 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:56,577 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:56,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:56,578 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:56,578 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:57,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:57,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:58,121 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.542921781539917 s; generated tokens: 20 tokens; generate speed: 12.96241989664502 tokens/s +2024-07-30 14:12:58,126 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:58,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1129/2067], cost time 1.5543s, every example cost time is 1.5543, generate speed: 12.8679 tokens/s, avg speed: 10.3115 tokens/s, remaining time: 0:21:22 +pred is: + ['1'] + label is: + ['the day after their original broadcast'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:12:58,209 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:58,209 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 282, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:58,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:58,209 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:58,210 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:12:59,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,494 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.28371262550354 s; generated tokens: 11 tokens; generate speed: 8.568896014156765 tokens/s +2024-07-30 14:12:59,498 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:12:59,499 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1130/2067], cost time 1.2950s, every example cost time is 1.2950, generate speed: 8.4940 tokens/s, avg speed: 10.3100 tokens/s, remaining time: 0:21:20 +pred is: + ['LoyalKaspar'] + label is: + ['LoyalKaspar'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.17598543509594, Em score: 50.08849557522124, current_count: 1130 +2024-07-30 14:12:59,936 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:12:59,937 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:12:59,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:12:59,938 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:12:59,938 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:00,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:00,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:00,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:00,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,140 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.202606439590454 s; generated tokens: 9 tokens; generate speed: 7.483745058828171 tokens/s +2024-07-30 14:13:01,145 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:01,146 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1131/2067], cost time 1.2145s, every example cost time is 1.2145, generate speed: 7.4102 tokens/s, avg speed: 10.3077 tokens/s, remaining time: 0:21:19 +pred is: + ['14'] + label is: + ['14'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:01,228 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:01,228 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 282, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:01,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:01,229 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:01,229 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:02,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,518 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2884702682495117 s; generated tokens: 11 tokens; generate speed: 8.537255589874313 tokens/s +2024-07-30 14:13:02,523 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:02,523 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1132/2067], cost time 1.2998s, every example cost time is 1.2998, generate speed: 8.4626 tokens/s, avg speed: 10.3061 tokens/s, remaining time: 0:21:17 +pred is: + ['Youngstown'] + label is: + ['Youngstown'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:02,605 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:02,605 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:02,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:02,606 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:02,606 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:03,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:03,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:04,151 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5442640781402588 s; generated tokens: 20 tokens; generate speed: 12.951152774391923 tokens/s +2024-07-30 14:13:04,156 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:04,156 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1133/2067], cost time 1.5556s, every example cost time is 1.5556, generate speed: 12.8571 tokens/s, avg speed: 10.3087 tokens/s, remaining time: 0:21:16 +pred is: + ['Walt Disney Presents'] + label is: + ['Walt Disney Presents'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:04,238 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:04,239 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 307, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:04,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:04,239 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:04,240 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:05,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,560 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.320115089416504 s; generated tokens: 13 tokens; generate speed: 9.847626244273938 tokens/s +2024-07-30 14:13:05,565 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:05,565 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1134/2067], cost time 1.3313s, every example cost time is 1.3313, generate speed: 9.7648 tokens/s, avg speed: 10.3082 tokens/s, remaining time: 0:21:15 +pred is: + ['The ABC Sunday Night Movie'] + label is: + ['ABC Sunday Night Movie'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:13:05,648 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:05,648 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:05,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:05,649 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:05,649 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:06,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,881 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2322776317596436 s; generated tokens: 10 tokens; generate speed: 8.115054385690987 tokens/s +2024-07-30 14:13:06,886 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:06,886 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1135/2067], cost time 1.2435s, every example cost time is 1.2435, generate speed: 8.0415 tokens/s, avg speed: 10.3064 tokens/s, remaining time: 0:21:13 +pred is: + ['ITT'] + label is: + ['ITT'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:06,969 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:06,969 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 380, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:06,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:06,970 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:06,970 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:07,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:07,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:07,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5636851787567139 s; generated tokens: 20 tokens; generate speed: 12.790298374447726 tokens/s +2024-07-30 14:13:08,538 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:08,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1136/2067], cost time 1.5751s, every example cost time is 1.5751, generate speed: 12.6979 tokens/s, avg speed: 10.3089 tokens/s, remaining time: 0:21:12 +pred is: + ['Capital Cities Communications'] + label is: + ['Capital Cities Communications'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:08,622 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:08,622 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 333, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:08,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:08,623 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:08,623 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:09,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:09,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:10,043 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4196627140045166 s; generated tokens: 16 tokens; generate speed: 11.270282611612702 tokens/s +2024-07-30 14:13:10,048 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:10,048 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1137/2067], cost time 1.4310s, every example cost time is 1.4310, generate speed: 11.1813 tokens/s, avg speed: 10.3097 tokens/s, remaining time: 0:21:11 +pred is: + ['September 5, 1985'] + label is: + ['September 5, 1985'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:10,130 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:10,130 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:10,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:10,131 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:10,131 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:11,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,636 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5042505264282227 s; generated tokens: 19 tokens; generate speed: 12.630874755360512 tokens/s +2024-07-30 14:13:11,641 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:11,641 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1138/2067], cost time 1.5156s, every example cost time is 1.5156, generate speed: 12.5366 tokens/s, avg speed: 10.3118 tokens/s, remaining time: 0:21:10 +pred is: + ['1'] + label is: + ['Laverne & Shirley'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:11,723 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:11,723 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:11,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:11,724 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:11,724 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:12,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:12,948 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.223642349243164 s; generated tokens: 9 tokens; generate speed: 7.355090321585059 tokens/s +2024-07-30 14:13:12,953 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:12,953 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1139/2067], cost time 1.2349s, every example cost time is 1.2349, generate speed: 7.2883 tokens/s, avg speed: 10.3094 tokens/s, remaining time: 0:21:08 +pred is: + ['TGIF'] + label is: + ['the "TGIF" block'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:13:13,036 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:13,036 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:13,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:13,037 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:13,037 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:13,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.227287769317627 s; generated tokens: 10 tokens; generate speed: 8.148048281748956 tokens/s +2024-07-30 14:13:14,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:14,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1140/2067], cost time 1.2384s, every example cost time is 1.2384, generate speed: 8.0749 tokens/s, avg speed: 10.3077 tokens/s, remaining time: 0:21:07 +pred is: + ['7'] + label is: + ['seven radio stations'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.23803819443721, Em score: 50.175438596491226, current_count: 1140 +2024-07-30 14:13:14,675 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:14,675 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:14,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:14,676 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:14,676 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:15,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:15,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:16,225 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5487301349639893 s; generated tokens: 20 tokens; generate speed: 12.913805671163644 tokens/s +2024-07-30 14:13:16,230 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:16,230 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1141/2067], cost time 1.5602s, every example cost time is 1.5602, generate speed: 12.8190 tokens/s, avg speed: 10.3102 tokens/s, remaining time: 0:21:05 +pred is: + ['1'] + label is: + ['westerns and detective series'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:16,313 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:16,313 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:16,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:16,314 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:16,314 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:17,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:17,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:17,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:17,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:17,355 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.040600299835205 s; generated tokens: 4 tokens; generate speed: 3.8439350830798924 tokens/s +2024-07-30 14:13:17,360 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:17,360 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1142/2067], cost time 1.0517s, every example cost time is 1.0517, generate speed: 3.8034 tokens/s, avg speed: 10.3058 tokens/s, remaining time: 0:21:04 +pred is: + ['Counterprogramming'] + label is: + ['counterprogramming'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:17,442 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:17,442 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 277, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:17,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:17,443 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:17,443 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:18,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:18,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:19,021 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.577718734741211 s; generated tokens: 20 tokens; generate speed: 12.676530714633714 tokens/s +2024-07-30 14:13:19,026 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:19,026 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1143/2067], cost time 1.5890s, every example cost time is 1.5890, generate speed: 12.5868 tokens/s, avg speed: 10.3081 tokens/s, remaining time: 0:21:03 +pred is: + ['WATCH ABC'] + label is: + ['WATCH ABC'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:19,108 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:19,108 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:19,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:19,109 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:19,109 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:20,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,494 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3843557834625244 s; generated tokens: 15 tokens; generate speed: 10.83536485287206 tokens/s +2024-07-30 14:13:20,498 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:20,499 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1144/2067], cost time 1.3958s, every example cost time is 1.3958, generate speed: 10.7465 tokens/s, avg speed: 10.3085 tokens/s, remaining time: 0:21:01 +pred is: + ['E. W. Scripps Company'] + label is: + ['Sinclair Broadcast Group'] +The F1/Em of this example is: {'F1': 14.285714285714285, 'Em': 0.0} +2024-07-30 14:13:20,582 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:20,582 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:20,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:20,583 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:20,583 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:21,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,832 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2488598823547363 s; generated tokens: 10 tokens; generate speed: 8.007303414330927 tokens/s +2024-07-30 14:13:21,837 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:21,838 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1145/2067], cost time 1.2606s, every example cost time is 1.2606, generate speed: 7.9329 tokens/s, avg speed: 10.3066 tokens/s, remaining time: 0:21:00 +pred is: + ['Start Here'] + label is: + ['Start Here'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:21,920 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:21,920 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:21,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:21,921 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:21,921 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:22,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:22,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:22,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:22,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:22,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,374 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4529731273651123 s; generated tokens: 17 tokens; generate speed: 11.700147566272319 tokens/s +2024-07-30 14:13:23,379 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:23,379 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1146/2067], cost time 1.4645s, every example cost time is 1.4645, generate speed: 11.6078 tokens/s, avg speed: 10.3078 tokens/s, remaining time: 0:20:59 +pred is: + ['WFTS-TV and WWSB'] + label is: + ['WFTS-TV and WWSB'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:23,463 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:23,463 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:23,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:23,464 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:23,464 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:24,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,572 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1080105304718018 s; generated tokens: 6 tokens; generate speed: 5.41511098946428 tokens/s +2024-07-30 14:13:24,577 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:24,577 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1147/2067], cost time 1.1195s, every example cost time is 1.1195, generate speed: 5.3596 tokens/s, avg speed: 10.3043 tokens/s, remaining time: 0:20:57 +pred is: + ['Mongol Empire'] + label is: + ['the Mongol Empire'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:13:24,660 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:24,660 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:24,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:24,661 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:24,661 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:25,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:25,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:26,211 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.549408197402954 s; generated tokens: 20 tokens; generate speed: 12.90815424464842 tokens/s +2024-07-30 14:13:26,216 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:26,216 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1148/2067], cost time 1.5612s, every example cost time is 1.5612, generate speed: 12.8107 tokens/s, avg speed: 10.3068 tokens/s, remaining time: 0:20:56 +pred is: + ['Ögedei Khan'] + label is: + ['Ögedei Khan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:26,299 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:26,299 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:26,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:26,300 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:26,300 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:27,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,444 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1436793804168701 s; generated tokens: 7 tokens; generate speed: 6.12059648871916 tokens/s +2024-07-30 14:13:27,449 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:27,449 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1149/2067], cost time 1.1553s, every example cost time is 1.1553, generate speed: 6.0592 tokens/s, avg speed: 10.3036 tokens/s, remaining time: 0:20:54 +pred is: + ['Delüün Boldog'] + label is: + ['Delüün Boldog'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:27,532 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:27,532 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:27,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:27,533 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:27,533 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:28,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:28,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:28,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:28,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:28,580 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0468487739562988 s; generated tokens: 4 tokens; generate speed: 3.820991244879637 tokens/s +2024-07-30 14:13:28,585 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:28,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1150/2067], cost time 1.0586s, every example cost time is 1.0586, generate speed: 3.7785 tokens/s, avg speed: 10.2992 tokens/s, remaining time: 0:20:53 +pred is: + ['Temülen'] + label is: + ['Temülen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.36578196169054, Em score: 50.34782608695652, current_count: 1150 +2024-07-30 14:13:29,016 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:29,016 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:29,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:29,017 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:29,017 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:29,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:29,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:30,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:30,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:30,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:30,096 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0784976482391357 s; generated tokens: 5 tokens; generate speed: 4.636078723178957 tokens/s +2024-07-30 14:13:30,101 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:30,101 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1151/2067], cost time 1.0901s, every example cost time is 1.0901, generate speed: 4.5867 tokens/s, avg speed: 10.2953 tokens/s, remaining time: 0:20:51 +pred is: + ['Khasar'] + label is: + ['Begter'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:30,184 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:30,184 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:30,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:30,185 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:30,185 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:31,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,329 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1440377235412598 s; generated tokens: 7 tokens; generate speed: 6.118679354673871 tokens/s +2024-07-30 14:13:31,334 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:31,335 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1152/2067], cost time 1.1558s, every example cost time is 1.1558, generate speed: 6.0567 tokens/s, avg speed: 10.2922 tokens/s, remaining time: 0:20:49 +pred is: + ["Tayichi'ud"] + label is: + ["the Tayichi'ud"] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:13:31,418 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:31,419 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:31,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:31,419 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:31,420 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:32,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:32,983 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5635087490081787 s; generated tokens: 20 tokens; generate speed: 12.791741659704252 tokens/s +2024-07-30 14:13:32,988 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:32,988 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1153/2067], cost time 1.5750s, every example cost time is 1.5750, generate speed: 12.6983 tokens/s, avg speed: 10.2946 tokens/s, remaining time: 0:20:48 +pred is: + ['Marriage'] + label is: + ['arranged marriages'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:33,072 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:33,072 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:33,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:33,073 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:33,073 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:34,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,628 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.554898977279663 s; generated tokens: 20 tokens; generate speed: 12.862571969138811 tokens/s +2024-07-30 14:13:34,633 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:34,634 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1154/2067], cost time 1.5667s, every example cost time is 1.5667, generate speed: 12.7653 tokens/s, avg speed: 10.2970 tokens/s, remaining time: 0:20:47 +pred is: + ['Onggirat'] + label is: + ['the Onggirat'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:13:34,728 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:34,728 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:34,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:34,729 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:34,729 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:35,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:35,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:35,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:35,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0143189430236816 s; generated tokens: 3 tokens; generate speed: 2.9576495841209565 tokens/s +2024-07-30 14:13:35,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:35,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1155/2067], cost time 1.0261s, every example cost time is 1.0261, generate speed: 2.9238 tokens/s, avg speed: 10.2922 tokens/s, remaining time: 0:20:45 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:35,831 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:35,831 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:35,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:35,832 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:35,832 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:36,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:36,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:37,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:37,006 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1741971969604492 s; generated tokens: 8 tokens; generate speed: 6.813165642627118 tokens/s +2024-07-30 14:13:37,011 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:37,011 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1156/2067], cost time 1.1857s, every example cost time is 1.1857, generate speed: 6.7470 tokens/s, avg speed: 10.2896 tokens/s, remaining time: 0:20:44 +pred is: + ['A sworn brother or blood brother'] + label is: + ['sworn brother or blood brother'] +The F1/Em of this example is: {'F1': 90.0, 'Em': 0.0} +2024-07-30 14:13:37,095 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:37,095 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 338, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:37,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:37,096 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:37,096 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:38,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,646 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5500271320343018 s; generated tokens: 20 tokens; generate speed: 12.902999945395411 tokens/s +2024-07-30 14:13:38,651 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:38,651 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1157/2067], cost time 1.5616s, every example cost time is 1.5616, generate speed: 12.8074 tokens/s, avg speed: 10.2921 tokens/s, remaining time: 0:20:43 +pred is: + ['The traditional Mongolian aristocracy'] + label is: + ['the traditional Mongolian aristocracy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:38,734 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:38,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:38,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:38,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:38,736 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:39,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,809 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0737144947052002 s; generated tokens: 5 tokens; generate speed: 4.656731398017313 tokens/s +2024-07-30 14:13:39,814 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:39,815 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1158/2067], cost time 1.0853s, every example cost time is 1.0853, generate speed: 4.6068 tokens/s, avg speed: 10.2881 tokens/s, remaining time: 0:20:41 +pred is: + ['Yassa code'] + label is: + ['the Yassa code'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:13:39,897 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:39,898 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:39,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:39,898 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:39,899 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:40,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:40,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:40,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:40,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:40,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,463 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5637092590332031 s; generated tokens: 20 tokens; generate speed: 12.790101410773401 tokens/s +2024-07-30 14:13:41,467 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:41,468 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1159/2067], cost time 1.5754s, every example cost time is 1.5754, generate speed: 12.6956 tokens/s, avg speed: 10.2905 tokens/s, remaining time: 0:20:40 +pred is: + ['Jochi'] + label is: + ['Jochi'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:41,550 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:41,550 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:41,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:41,551 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:41,551 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:42,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:42,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:43,102 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5507354736328125 s; generated tokens: 20 tokens; generate speed: 12.897106140963702 tokens/s +2024-07-30 14:13:43,107 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:43,107 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1160/2067], cost time 1.5622s, every example cost time is 1.5622, generate speed: 12.8027 tokens/s, avg speed: 10.2930 tokens/s, remaining time: 0:20:39 +pred is: + ['The Naimans'] + label is: + ['the Naimans'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.31952522064148, Em score: 50.172413793103445, current_count: 1160 +2024-07-30 14:13:43,526 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:43,526 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:43,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:43,527 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:43,527 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:44,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:44,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:44,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:44,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:44,574 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0464098453521729 s; generated tokens: 4 tokens; generate speed: 3.8225940034554875 tokens/s +2024-07-30 14:13:44,579 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:44,579 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1161/2067], cost time 1.0581s, every example cost time is 1.0581, generate speed: 3.7804 tokens/s, avg speed: 10.2887 tokens/s, remaining time: 0:20:37 +pred is: + ['friendship'] + label is: + ['his friendship'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:13:44,663 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:44,663 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:44,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:44,664 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:44,664 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:45,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:45,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:45,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:45,684 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0197715759277344 s; generated tokens: 3 tokens; generate speed: 2.941835280386942 tokens/s +2024-07-30 14:13:45,689 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:45,689 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1162/2067], cost time 1.0314s, every example cost time is 1.0314, generate speed: 2.9085 tokens/s, avg speed: 10.2839 tokens/s, remaining time: 0:20:35 +pred is: + ['Chinese'] + label is: + ['the Chinese'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:13:45,773 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:45,773 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:45,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:45,774 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:45,774 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:46,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:46,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:47,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:47,328 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5538489818572998 s; generated tokens: 20 tokens; generate speed: 12.871263702920604 tokens/s +2024-07-30 14:13:47,333 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:47,333 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1163/2067], cost time 1.5657s, every example cost time is 1.5657, generate speed: 12.7739 tokens/s, avg speed: 10.2863 tokens/s, remaining time: 0:20:34 +pred is: + ['1206'] + label is: + ['1206'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:47,417 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:47,417 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:47,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:47,418 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:47,418 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:48,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:48,962 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5435786247253418 s; generated tokens: 20 tokens; generate speed: 12.95690396306098 tokens/s +2024-07-30 14:13:48,967 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:48,967 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1164/2067], cost time 1.5552s, every example cost time is 1.5552, generate speed: 12.8599 tokens/s, avg speed: 10.2889 tokens/s, remaining time: 0:20:33 +pred is: + ['Jin'] + label is: + ['the Jin dynasty'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:13:49,049 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:49,049 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:49,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:49,050 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:49,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:49,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,592 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5415325164794922 s; generated tokens: 20 tokens; generate speed: 12.974101931807073 tokens/s +2024-07-30 14:13:50,597 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:50,597 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1165/2067], cost time 1.5527s, every example cost time is 1.5527, generate speed: 12.8805 tokens/s, avg speed: 10.2914 tokens/s, remaining time: 0:20:32 +pred is: + ['Kuchlug'] + label is: + ['Kuchlug'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:50,680 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:50,680 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:50,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:50,681 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:50,681 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:51,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:51,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:52,227 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5456290245056152 s; generated tokens: 20 tokens; generate speed: 12.939715599865368 tokens/s +2024-07-30 14:13:52,231 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:52,232 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1166/2067], cost time 1.5569s, every example cost time is 1.5569, generate speed: 12.8462 tokens/s, avg speed: 10.2939 tokens/s, remaining time: 0:20:31 +pred is: + ['inciting internal revolt'] + label is: + ['inciting internal revolt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:52,315 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:52,315 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 350, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:52,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:52,316 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:52,316 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:53,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,873 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.556915283203125 s; generated tokens: 20 tokens; generate speed: 12.845914107062352 tokens/s +2024-07-30 14:13:53,878 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:53,878 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1167/2067], cost time 1.5685s, every example cost time is 1.5685, generate speed: 12.7513 tokens/s, avg speed: 10.2963 tokens/s, remaining time: 0:20:29 +pred is: + ['Shah Ala ad-Din Muhammad'] + label is: + ['Shah Ala ad-Din Muhammad'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:53,962 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:53,962 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:53,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:53,963 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:53,963 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:54,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:54,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:54,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:55,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:55,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:55,039 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0754446983337402 s; generated tokens: 5 tokens; generate speed: 4.649239526445982 tokens/s +2024-07-30 14:13:55,043 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:55,044 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1168/2067], cost time 1.0868s, every example cost time is 1.0868, generate speed: 4.6008 tokens/s, avg speed: 10.2924 tokens/s, remaining time: 0:20:28 +pred is: + ['Tien Shan'] + label is: + ['Tien Shan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:13:55,134 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:55,134 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:55,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:55,135 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:55,135 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:56,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,682 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.546743631362915 s; generated tokens: 20 tokens; generate speed: 12.93039104507382 tokens/s +2024-07-30 14:13:56,687 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:56,687 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1169/2067], cost time 1.5662s, every example cost time is 1.5662, generate speed: 12.7701 tokens/s, avg speed: 10.2948 tokens/s, remaining time: 0:20:27 +pred is: + ["The Shah's army was split by diverse internecine feuds and by the Shah's decision"] + label is: + ['fragmentation'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:13:56,770 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:56,770 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:56,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:56,771 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:56,771 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:57,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:57,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:58,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:58,321 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.549628734588623 s; generated tokens: 20 tokens; generate speed: 12.906317205914075 tokens/s +2024-07-30 14:13:58,326 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:13:58,326 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1170/2067], cost time 1.5609s, every example cost time is 1.5609, generate speed: 12.8129 tokens/s, avg speed: 10.2973 tokens/s, remaining time: 0:20:25 +pred is: + ['Samarkand'] + label is: + ['Samarkand'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.39656631562175, Em score: 50.256410256410255, current_count: 1170 +2024-07-30 14:13:58,756 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:13:58,757 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:13:58,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:58,757 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:13:58,757 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:13:59,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:13:59,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:00,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.564223051071167 s; generated tokens: 20 tokens; generate speed: 12.785900314091501 tokens/s +2024-07-30 14:14:00,327 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:00,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1171/2067], cost time 1.5765s, every example cost time is 1.5765, generate speed: 12.6862 tokens/s, avg speed: 10.2997 tokens/s, remaining time: 0:20:24 +pred is: + ['Captured enemies'] + label is: + ['captured enemies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:00,413 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:00,413 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:00,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:00,414 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:00,414 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:01,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:01,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5550329685211182 s; generated tokens: 20 tokens; generate speed: 12.86146365052349 tokens/s +2024-07-30 14:14:01,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:01,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1172/2067], cost time 1.5671s, every example cost time is 1.5671, generate speed: 12.7623 tokens/s, avg speed: 10.3021 tokens/s, remaining time: 0:20:23 +pred is: + ['They opened the gates to the Mongols.'] + label is: + ['opened the gates'] +The F1/Em of this example is: {'F1': 52.63157894736842, 'Em': 0.0} +2024-07-30 14:14:02,058 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:02,058 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 508, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:02,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:02,059 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:02,059 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:03,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,624 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5642168521881104 s; generated tokens: 20 tokens; generate speed: 12.785950983728968 tokens/s +2024-07-30 14:14:03,629 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:03,629 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1173/2067], cost time 1.5762s, every example cost time is 1.5762, generate speed: 12.6891 tokens/s, avg speed: 10.3044 tokens/s, remaining time: 0:20:22 +pred is: + ['1220'] + label is: + ['1220'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:03,712 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:03,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 266, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:03,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:03,713 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:03,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:04,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:04,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:05,262 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.547959566116333 s; generated tokens: 20 tokens; generate speed: 12.92023411837422 tokens/s +2024-07-30 14:14:05,267 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:05,267 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1174/2067], cost time 1.5595s, every example cost time is 1.5595, generate speed: 12.8244 tokens/s, avg speed: 10.3069 tokens/s, remaining time: 0:20:21 +pred is: + ['Batu'] + label is: + ['Batu'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:05,349 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:05,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:05,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:05,350 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:05,350 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:06,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,774 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4234917163848877 s; generated tokens: 16 tokens; generate speed: 11.239967058349832 tokens/s +2024-07-30 14:14:06,779 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:06,779 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1175/2067], cost time 1.4352s, every example cost time is 1.4352, generate speed: 11.1481 tokens/s, avg speed: 10.3076 tokens/s, remaining time: 0:20:19 +pred is: + ['1226'] + label is: + ['1226'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:06,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:06,863 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:06,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:06,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:06,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:07,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:07,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:07,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:07,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:07,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:07,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,415 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5507688522338867 s; generated tokens: 20 tokens; generate speed: 12.896828544879494 tokens/s +2024-07-30 14:14:08,420 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:08,420 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1176/2067], cost time 1.5625s, every example cost time is 1.5625, generate speed: 12.8002 tokens/s, avg speed: 10.3100 tokens/s, remaining time: 0:20:18 +pred is: + ['Ning Hia'] + label is: + ['Ning Hia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:08,503 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:08,504 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:08,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:08,504 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:08,504 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:09,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,580 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0754742622375488 s; generated tokens: 5 tokens; generate speed: 4.649111722671434 tokens/s +2024-07-30 14:14:09,585 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:09,585 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1177/2067], cost time 1.0871s, every example cost time is 1.0871, generate speed: 4.5993 tokens/s, avg speed: 10.3062 tokens/s, remaining time: 0:20:16 +pred is: + ['Jochi'] + label is: + ['Jochi'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:09,669 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:09,669 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 279, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:09,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:09,670 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:09,670 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:10,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:10,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:11,238 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.567652940750122 s; generated tokens: 20 tokens; generate speed: 12.757925864911144 tokens/s +2024-07-30 14:14:11,254 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:11,255 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1178/2067], cost time 1.5912s, every example cost time is 1.5912, generate speed: 12.5691 tokens/s, avg speed: 10.3084 tokens/s, remaining time: 0:20:15 +pred is: + ['Chagatai and Jochi'] + label is: + ['Chagatai and Jochi'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:11,339 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:11,340 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 308, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:11,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:11,340 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:11,341 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:12,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,904 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.563504934310913 s; generated tokens: 20 tokens; generate speed: 12.79177286946948 tokens/s +2024-07-30 14:14:12,913 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:12,913 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1179/2067], cost time 1.5794s, every example cost time is 1.5794, generate speed: 12.6632 tokens/s, avg speed: 10.3107 tokens/s, remaining time: 0:20:14 +pred is: + ['1226'] + label is: + ['1226'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:12,997 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:12,997 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:12,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:12,998 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:12,998 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:13,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:13,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,559 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5607621669769287 s; generated tokens: 20 tokens; generate speed: 12.814252179586335 tokens/s +2024-07-30 14:14:14,564 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:14,564 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1180/2067], cost time 1.5729s, every example cost time is 1.5729, generate speed: 12.7157 tokens/s, avg speed: 10.3131 tokens/s, remaining time: 0:20:13 +pred is: + ['Yinchuan'] + label is: + ['Yinchuan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.65814760019053, Em score: 50.59322033898305, current_count: 1180 +2024-07-30 14:14:14,988 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:14,988 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:14,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:14,989 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:14,989 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:15,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:15,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,588 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5987474918365479 s; generated tokens: 20 tokens; generate speed: 12.509792886070562 tokens/s +2024-07-30 14:14:16,593 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:16,593 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1181/2067], cost time 1.6110s, every example cost time is 1.6110, generate speed: 12.4150 tokens/s, avg speed: 10.3152 tokens/s, remaining time: 0:20:12 +pred is: + ['Without markings'] + label is: + ['without markings'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:16,706 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:16,707 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:16,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:16,707 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:16,708 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:17,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,852 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1438055038452148 s; generated tokens: 7 tokens; generate speed: 6.119921591973099 tokens/s +2024-07-30 14:14:17,856 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:17,857 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1182/2067], cost time 1.1557s, every example cost time is 1.1557, generate speed: 6.0570 tokens/s, avg speed: 10.3121 tokens/s, remaining time: 0:20:10 +pred is: + ['Edsen Khoroo'] + label is: + ['Edsen Khoroo'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:17,939 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:17,940 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:17,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:17,941 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:17,941 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:18,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:18,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:18,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:18,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,306 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.365208387374878 s; generated tokens: 14 tokens; generate speed: 10.25484470317401 tokens/s +2024-07-30 14:14:19,311 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:19,311 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1183/2067], cost time 1.3769s, every example cost time is 1.3769, generate speed: 10.1676 tokens/s, avg speed: 10.3120 tokens/s, remaining time: 0:20:09 +pred is: + ['October 6, 2004'] + label is: + ['October 6, 2004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:19,395 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:19,396 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:19,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:19,396 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:19,396 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:20,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:20,951 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5547394752502441 s; generated tokens: 20 tokens; generate speed: 12.863891551207244 tokens/s +2024-07-30 14:14:20,956 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:20,957 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1184/2067], cost time 1.5665s, every example cost time is 1.5665, generate speed: 12.7670 tokens/s, avg speed: 10.3144 tokens/s, remaining time: 0:20:07 +pred is: + ['Genghis Khan'] + label is: + ['Genghis Khan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:21,039 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:21,040 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:21,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:21,040 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:21,040 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:21,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:22,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:22,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:22,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:22,084 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.043548583984375 s; generated tokens: 4 tokens; generate speed: 3.8330750109665157 tokens/s +2024-07-30 14:14:22,089 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:22,089 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1185/2067], cost time 1.0550s, every example cost time is 1.0550, generate speed: 3.7915 tokens/s, avg speed: 10.3101 tokens/s, remaining time: 0:20:06 +pred is: + ['Tax exemptions'] + label is: + ['tax exemptions'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:22,172 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:22,172 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:22,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:22,173 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:22,173 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:23,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,721 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5469987392425537 s; generated tokens: 20 tokens; generate speed: 12.928258758499352 tokens/s +2024-07-30 14:14:23,725 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:23,726 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1186/2067], cost time 1.5587s, every example cost time is 1.5587, generate speed: 12.8312 tokens/s, avg speed: 10.3125 tokens/s, remaining time: 0:20:05 +pred is: + ['1'] + label is: + ['Töregene Khatun'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:14:23,809 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:23,809 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:23,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:23,810 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:23,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:24,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:24,975 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.164517879486084 s; generated tokens: 7 tokens; generate speed: 6.011071296809273 tokens/s +2024-07-30 14:14:24,980 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:24,980 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1187/2067], cost time 1.1761s, every example cost time is 1.1761, generate speed: 5.9518 tokens/s, avg speed: 10.3094 tokens/s, remaining time: 0:20:03 +pred is: + ["Chu'Tsai"] + label is: + ["Chu'Tsai"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:25,063 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:25,063 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:25,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:25,064 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:25,064 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:26,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,645 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5805745124816895 s; generated tokens: 20 tokens; generate speed: 12.653626793334551 tokens/s +2024-07-30 14:14:26,650 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:26,650 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1188/2067], cost time 1.5925s, every example cost time is 1.5925, generate speed: 12.5589 tokens/s, avg speed: 10.3116 tokens/s, remaining time: 0:20:02 +pred is: + ['Generals'] + label is: + ['his generals'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:14:26,733 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:26,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:26,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:26,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:26,735 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:27,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:27,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:28,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.55069899559021 s; generated tokens: 20 tokens; generate speed: 12.897409527493645 tokens/s +2024-07-30 14:14:28,290 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:28,291 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1189/2067], cost time 1.5625s, every example cost time is 1.5625, generate speed: 12.7998 tokens/s, avg speed: 10.3140 tokens/s, remaining time: 0:20:01 +pred is: + ['Rivers'] + label is: + ['rivers'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:28,374 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:28,375 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:28,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:28,375 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:28,376 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:29,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,457 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0809447765350342 s; generated tokens: 5 tokens; generate speed: 4.625583201417086 tokens/s +2024-07-30 14:14:29,462 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:29,462 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1190/2067], cost time 1.0927s, every example cost time is 1.0927, generate speed: 4.5760 tokens/s, avg speed: 10.3101 tokens/s, remaining time: 0:19:59 +pred is: + ['Sea of Japan'] + label is: + ['Sea of Japan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.82908753632339, Em score: 50.84033613445378, current_count: 1190 +2024-07-30 14:14:29,908 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:29,908 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:29,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:29,909 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:29,909 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:30,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:30,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:30,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:30,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:30,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,488 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5781898498535156 s; generated tokens: 20 tokens; generate speed: 12.67274656585604 tokens/s +2024-07-30 14:14:31,493 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:31,493 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1191/2067], cost time 1.5901s, every example cost time is 1.5901, generate speed: 12.5782 tokens/s, avg speed: 10.3123 tokens/s, remaining time: 0:19:58 +pred is: + ['Silk Road'] + label is: + ['the Silk Road'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:14:31,576 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:31,576 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:31,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:31,577 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:31,577 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:32,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:32,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:33,132 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5542259216308594 s; generated tokens: 20 tokens; generate speed: 12.868142090317134 tokens/s +2024-07-30 14:14:33,137 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:33,137 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1192/2067], cost time 1.5661s, every example cost time is 1.5661, generate speed: 12.7708 tokens/s, avg speed: 10.3147 tokens/s, remaining time: 0:19:57 +pred is: + ['1990s'] + label is: + ['1990s'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:33,220 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:33,220 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:33,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:33,221 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:33,221 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:34,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,327 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1055970191955566 s; generated tokens: 6 tokens; generate speed: 5.426932142387341 tokens/s +2024-07-30 14:14:34,332 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:34,332 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1193/2067], cost time 1.1173s, every example cost time is 1.1173, generate speed: 5.3700 tokens/s, avg speed: 10.3113 tokens/s, remaining time: 0:19:55 +pred is: + ['Tögrög'] + label is: + ['tögrög'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:34,415 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:34,415 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 358, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:34,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:34,416 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:34,416 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:35,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,585 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.168536901473999 s; generated tokens: 7 tokens; generate speed: 5.990397043662173 tokens/s +2024-07-30 14:14:35,590 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:35,590 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1194/2067], cost time 1.1802s, every example cost time is 1.1802, generate speed: 5.9311 tokens/s, avg speed: 10.3081 tokens/s, remaining time: 0:19:54 +pred is: + ['Ikh Zasag'] + label is: + ['Ikh Zasag'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:35,674 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:35,674 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:35,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:35,675 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:35,675 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:36,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:36,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:37,075 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3998651504516602 s; generated tokens: 15 tokens; generate speed: 10.715317825549352 tokens/s +2024-07-30 14:14:37,080 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:37,080 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1195/2067], cost time 1.4116s, every example cost time is 1.4116, generate speed: 10.6259 tokens/s, avg speed: 10.3084 tokens/s, remaining time: 0:19:52 +pred is: + ['Inner Mongolia'] + label is: + ['Inner Mongolia region'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:14:37,165 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:37,165 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:37,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:37,166 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:37,166 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:38,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:38,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:38,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:38,178 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0115540027618408 s; generated tokens: 3 tokens; generate speed: 2.9657339023019187 tokens/s +2024-07-30 14:14:38,183 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:38,183 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1196/2067], cost time 1.0234s, every example cost time is 1.0234, generate speed: 2.9315 tokens/s, avg speed: 10.3038 tokens/s, remaining time: 0:19:51 +pred is: + ['Iran'] + label is: + ['Iran'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:38,266 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:38,267 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:38,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:38,267 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:38,267 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:39,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,863 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.595226526260376 s; generated tokens: 20 tokens; generate speed: 12.537404356536861 tokens/s +2024-07-30 14:14:39,868 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:39,868 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1197/2067], cost time 1.6070s, every example cost time is 1.6070, generate speed: 12.4455 tokens/s, avg speed: 10.3059 tokens/s, remaining time: 0:19:50 +pred is: + ['Hulagu Khan'] + label is: + ['Hulagu Khan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:39,950 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:39,951 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:39,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:39,951 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:39,952 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:40,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:40,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:40,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:40,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,495 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5436131954193115 s; generated tokens: 20 tokens; generate speed: 12.956613780803515 tokens/s +2024-07-30 14:14:41,500 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:41,501 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1198/2067], cost time 1.5551s, every example cost time is 1.5551, generate speed: 12.8609 tokens/s, avg speed: 10.3083 tokens/s, remaining time: 0:19:48 +pred is: + ['Mughal Emperors'] + label is: + ['Mughal emperors'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:41,584 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:41,585 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:41,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:41,585 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:41,586 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:42,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,844 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.258073091506958 s; generated tokens: 11 tokens; generate speed: 8.743530144837505 tokens/s +2024-07-30 14:14:42,849 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:42,849 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1199/2067], cost time 1.2696s, every example cost time is 1.2696, generate speed: 8.6640 tokens/s, avg speed: 10.3071 tokens/s, remaining time: 0:19:47 +pred is: + ['tenggis'] + label is: + ['tenggis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:42,932 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:42,932 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:42,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:42,933 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:42,933 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:43,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:43,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:43,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:43,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,102 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1684932708740234 s; generated tokens: 8 tokens; generate speed: 6.846423680314449 tokens/s +2024-07-30 14:14:44,106 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:44,107 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1200/2067], cost time 1.1800s, every example cost time is 1.1800, generate speed: 6.7797 tokens/s, avg speed: 10.3045 tokens/s, remaining time: 0:19:45 +pred is: + ['Chinggis Khaan'] + label is: + ['Chinggis Khaan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 65.08051180685402, Em score: 51.083333333333336, current_count: 1200 +2024-07-30 14:14:44,536 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:44,537 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 280, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:44,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:44,537 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:44,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:45,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:45,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:46,079 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541550636291504 s; generated tokens: 20 tokens; generate speed: 12.973949430629046 tokens/s +2024-07-30 14:14:46,084 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:46,084 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1201/2067], cost time 1.5534s, every example cost time is 1.5534, generate speed: 12.8754 tokens/s, avg speed: 10.3070 tokens/s, remaining time: 0:19:44 +pred is: + ['pharma'] + label is: + ['its root word pharma'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:14:46,166 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:46,166 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 138, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:46,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:46,167 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:46,167 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:47,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,248 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0807127952575684 s; generated tokens: 5 tokens; generate speed: 4.626576109713164 tokens/s +2024-07-30 14:14:47,253 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:47,253 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1202/2067], cost time 1.0920s, every example cost time is 1.0920, generate speed: 4.5786 tokens/s, avg speed: 10.3031 tokens/s, remaining time: 0:19:43 +pred is: + ['Healthcare professionals'] + label is: + ['healthcare professionals'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:47,336 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:47,336 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:47,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:47,337 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:47,337 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:48,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,601 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.264108419418335 s; generated tokens: 11 tokens; generate speed: 8.70178525119034 tokens/s +2024-07-30 14:14:48,606 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:48,607 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1203/2067], cost time 1.2755s, every example cost time is 1.2755, generate speed: 8.6240 tokens/s, avg speed: 10.3018 tokens/s, remaining time: 0:19:41 +pred is: + ['The General Pharmaceutical Council (GPhC)'] + label is: + ['other senior pharmacy technicians'] +The F1/Em of this example is: {'F1': 11.11111111111111, 'Em': 0.0} +2024-07-30 14:14:48,696 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:48,696 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:48,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:48,697 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:48,697 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:49,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:49,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:50,247 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.549466609954834 s; generated tokens: 20 tokens; generate speed: 12.907667626721551 tokens/s +2024-07-30 14:14:50,252 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:50,252 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1204/2067], cost time 1.5614s, every example cost time is 1.5614, generate speed: 12.8091 tokens/s, avg speed: 10.3042 tokens/s, remaining time: 0:19:40 +pred is: + ['He wrote a five volume book on the medicinal properties of plants.'] + label is: + ['writing a five volume book in his native Greek'] +The F1/Em of this example is: {'F1': 43.90243902439025, 'Em': 0.0} +2024-07-30 14:14:50,335 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:50,336 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:50,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:50,336 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:50,336 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:51,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,888 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5512080192565918 s; generated tokens: 20 tokens; generate speed: 12.893177286167521 tokens/s +2024-07-30 14:14:51,893 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:51,893 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1205/2067], cost time 1.5629s, every example cost time is 1.5629, generate speed: 12.7971 tokens/s, avg speed: 10.3066 tokens/s, remaining time: 0:19:39 +pred is: + ['1'] + label is: + ['highly respected'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:14:51,977 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:51,977 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 518, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:51,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:51,978 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:51,978 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:52,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:52,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:52,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,530 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5514543056488037 s; generated tokens: 20 tokens; generate speed: 12.891130552269916 tokens/s +2024-07-30 14:14:53,534 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:53,535 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1206/2067], cost time 1.5633s, every example cost time is 1.5633, generate speed: 12.7935 tokens/s, avg speed: 10.3089 tokens/s, remaining time: 0:19:37 +pred is: + ['1'] + label is: + ['botany and chemistry'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:14:53,618 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:53,619 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:53,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:53,619 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:53,620 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:54,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:54,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:54,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:54,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:54,664 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.043975591659546 s; generated tokens: 4 tokens; generate speed: 3.8315072037665536 tokens/s +2024-07-30 14:14:54,669 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:54,669 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1207/2067], cost time 1.0555s, every example cost time is 1.0555, generate speed: 3.7895 tokens/s, avg speed: 10.3048 tokens/s, remaining time: 0:19:36 +pred is: + ['1317'] + label is: + ['1317'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:54,751 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:54,751 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:54,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:54,752 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:54,752 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:55,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:55,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:56,294 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5416245460510254 s; generated tokens: 20 tokens; generate speed: 12.973327423484104 tokens/s +2024-07-30 14:14:56,299 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:56,299 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1208/2067], cost time 1.5534s, every example cost time is 1.5534, generate speed: 12.8748 tokens/s, avg speed: 10.3072 tokens/s, remaining time: 0:19:35 +pred is: + ['Pharmacy legislation'] + label is: + ['pharmacy legislation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:14:56,382 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:56,383 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:56,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:56,383 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:56,384 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:57,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:57,942 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.558591604232788 s; generated tokens: 20 tokens; generate speed: 12.832097866871893 tokens/s +2024-07-30 14:14:57,947 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:57,948 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1209/2067], cost time 1.5703s, every example cost time is 1.5703, generate speed: 12.7361 tokens/s, avg speed: 10.3095 tokens/s, remaining time: 0:19:33 +pred is: + ['1'] + label is: + ['a pharmacy practice residency'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:14:58,031 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:58,032 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:58,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:58,032 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:58,032 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:14:58,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,200 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1675620079040527 s; generated tokens: 8 tokens; generate speed: 6.8518844788048465 tokens/s +2024-07-30 14:14:59,205 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:14:59,205 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1210/2067], cost time 1.1793s, every example cost time is 1.1793, generate speed: 6.7836 tokens/s, avg speed: 10.3070 tokens/s, remaining time: 0:19:32 +pred is: + ['Within the premises of the hospital'] + label is: + ['within the premises of the hospital'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.93936175071102, Em score: 50.99173553719008, current_count: 1210 +2024-07-30 14:14:59,637 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:14:59,638 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 140, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:14:59,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:14:59,638 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:14:59,638 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:00,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:00,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:01,188 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5497808456420898 s; generated tokens: 20 tokens; generate speed: 12.905050450351771 tokens/s +2024-07-30 14:15:01,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:01,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1211/2067], cost time 1.5616s, every example cost time is 1.5616, generate speed: 12.8070 tokens/s, avg speed: 10.3093 tokens/s, remaining time: 0:19:31 +pred is: + ['Optimizes the use of medication and promotes health, wellness, and disease prevention'] + label is: + ['optimizes the use of medication and promotes health, wellness, and disease prevention'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:01,279 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:01,280 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:01,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:01,281 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:01,281 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:02,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,825 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5437862873077393 s; generated tokens: 20 tokens; generate speed: 12.955161063697924 tokens/s +2024-07-30 14:15:02,830 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:02,830 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1212/2067], cost time 1.5556s, every example cost time is 1.5556, generate speed: 12.8567 tokens/s, avg speed: 10.3117 tokens/s, remaining time: 0:19:29 +pred is: + ['Reviewing all prescribed medications prior to dispensing and administration to the patient'] + label is: + ['creating a comprehensive drug therapy plan for patient-specific problems'] +The F1/Em of this example is: {'F1': 5.0, 'Em': 0.0} +2024-07-30 14:15:02,914 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:02,915 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:02,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:02,915 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:02,915 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:03,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:03,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:03,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:03,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:03,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,465 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5488898754119873 s; generated tokens: 20 tokens; generate speed: 12.912473841744381 tokens/s +2024-07-30 14:15:04,469 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:04,470 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1213/2067], cost time 1.5604s, every example cost time is 1.5604, generate speed: 12.8170 tokens/s, avg speed: 10.3141 tokens/s, remaining time: 0:19:28 +pred is: + ['1'] + label is: + ['full independent prescribing authority'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:04,553 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:04,554 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:04,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:04,554 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:04,555 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:05,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:05,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:06,112 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5573468208312988 s; generated tokens: 20 tokens; generate speed: 12.842354530459803 tokens/s +2024-07-30 14:15:06,117 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:06,117 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1214/2067], cost time 1.5688s, every example cost time is 1.5688, generate speed: 12.7490 tokens/s, avg speed: 10.3164 tokens/s, remaining time: 0:19:27 +pred is: + ['1'] + label is: + ['medication regimen review'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:06,201 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:06,202 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:06,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:06,202 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:06,203 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:07,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,744 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5415301322937012 s; generated tokens: 20 tokens; generate speed: 12.97412199801845 tokens/s +2024-07-30 14:15:07,749 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:07,749 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1215/2067], cost time 1.5533s, every example cost time is 1.5533, generate speed: 12.8762 tokens/s, avg speed: 10.3188 tokens/s, remaining time: 0:19:26 +pred is: + ['2000'] + label is: + ['about the year 2000'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:15:07,833 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:07,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:07,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:07,834 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:07,834 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:08,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:08,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:09,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:09,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:09,373 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5388824939727783 s; generated tokens: 20 tokens; generate speed: 12.99644389895424 tokens/s +2024-07-30 14:15:09,378 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:09,378 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1216/2067], cost time 1.5505s, every example cost time is 1.5505, generate speed: 12.8992 tokens/s, avg speed: 10.3212 tokens/s, remaining time: 0:19:24 +pred is: + ['To avoid the "inconvenience" of visiting a doctor'] + label is: + ['to avoid the "inconvenience" of visiting a doctor or to obtain medications which their doctors were unwilling to prescribe'] +The F1/Em of this example is: {'F1': 60.71428571428571, 'Em': 0.0} +2024-07-30 14:15:09,463 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:09,463 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:09,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:09,464 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:09,464 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:10,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:10,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:11,019 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5541677474975586 s; generated tokens: 20 tokens; generate speed: 12.868623758408948 tokens/s +2024-07-30 14:15:11,023 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:11,024 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1217/2067], cost time 1.5659s, every example cost time is 1.5659, generate speed: 12.7722 tokens/s, avg speed: 10.3235 tokens/s, remaining time: 0:19:23 +pred is: + ['People can obtain controlled substances without a prescription issued by a doctor/practitioner who has an established'] + label is: + ['the ease with which people, youth in particular, can obtain controlled substances'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:15:11,109 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:11,110 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:11,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:11,110 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:11,110 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:12,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,652 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5414848327636719 s; generated tokens: 20 tokens; generate speed: 12.974503267828286 tokens/s +2024-07-30 14:15:12,657 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:12,657 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1218/2067], cost time 1.5531s, every example cost time is 1.5531, generate speed: 12.8773 tokens/s, avg speed: 10.3259 tokens/s, remaining time: 0:19:22 +pred is: + ['1'] + label is: + ['to reduce consumer costs'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:12,742 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:12,742 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:12,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:12,743 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:12,743 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:13,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:13,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:14,283 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5395896434783936 s; generated tokens: 20 tokens; generate speed: 12.990474497356333 tokens/s +2024-07-30 14:15:14,288 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:14,288 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1219/2067], cost time 1.5516s, every example cost time is 1.5516, generate speed: 12.8902 tokens/s, avg speed: 10.3282 tokens/s, remaining time: 0:19:21 +pred is: + ['Pharmacy practice science and applied information science'] + label is: + ['pharmacy practice science and applied information science'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:14,372 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:14,372 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:14,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:14,373 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:14,373 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:15,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0745079517364502 s; generated tokens: 5 tokens; generate speed: 4.653292692641119 tokens/s +2024-07-30 14:15:15,452 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:15,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1220/2067], cost time 1.0863s, every example cost time is 1.0863, generate speed: 4.6029 tokens/s, avg speed: 10.3245 tokens/s, remaining time: 0:19:19 +pred is: + ['Specialty pharmacies'] + label is: + ['specialty pharmacies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.75074871528365, Em score: 50.81967213114754, current_count: 1220 +2024-07-30 14:15:15,888 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:15,888 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:15,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:15,889 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:15,889 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:16,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:16,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:16,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:16,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:16,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:16,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,023 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,428 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539027214050293 s; generated tokens: 20 tokens; generate speed: 12.995221798167911 tokens/s +2024-07-30 14:15:17,433 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:17,434 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1221/2067], cost time 1.5510s, every example cost time is 1.5510, generate speed: 12.8946 tokens/s, avg speed: 10.3269 tokens/s, remaining time: 0:19:18 +pred is: + ['Pharmacists are regulated separately from physicians.'] + label is: + ['separately from physicians'] +The F1/Em of this example is: {'F1': 58.82352941176471, 'Em': 0.0} +2024-07-30 14:15:17,517 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:17,517 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:17,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:17,518 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:17,518 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:18,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:18,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:18,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:18,528 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0101556777954102 s; generated tokens: 3 tokens; generate speed: 2.969839269277066 tokens/s +2024-07-30 14:15:18,533 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:18,533 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1222/2067], cost time 1.0214s, every example cost time is 1.0214, generate speed: 2.9371 tokens/s, avg speed: 10.3224 tokens/s, remaining time: 0:19:16 +pred is: + ['France'] + label is: + ['Austria'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:18,616 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:18,616 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:18,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:18,617 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:18,617 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:19,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:19,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:20,159 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541846513748169 s; generated tokens: 20 tokens; generate speed: 12.971459754045672 tokens/s +2024-07-30 14:15:20,164 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:20,164 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1223/2067], cost time 1.5533s, every example cost time is 1.5533, generate speed: 12.8761 tokens/s, avg speed: 10.3248 tokens/s, remaining time: 0:19:15 +pred is: + ['1'] + label is: + ['the high risk of a conflict of interest and/or the avoidance of absolute powers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:20,248 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:20,248 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:20,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:20,249 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:20,249 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:21,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,639 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3896517753601074 s; generated tokens: 15 tokens; generate speed: 10.794071051442348 tokens/s +2024-07-30 14:15:21,644 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:21,644 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1224/2067], cost time 1.4015s, every example cost time is 1.4015, generate speed: 10.7029 tokens/s, avg speed: 10.3251 tokens/s, remaining time: 0:19:14 +pred is: + ['Pharmacists will become more integral within the health care system.'] + label is: + ['expected to become more integral within the health care system'] +The F1/Em of this example is: {'F1': 82.05128205128204, 'Em': 0.0} +2024-07-30 14:15:21,728 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:21,729 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 306, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:21,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:21,729 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:21,730 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:22,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:22,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:23,287 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5572967529296875 s; generated tokens: 20 tokens; generate speed: 12.84276741884596 tokens/s +2024-07-30 14:15:23,292 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:23,293 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1225/2067], cost time 1.5693s, every example cost time is 1.5693, generate speed: 12.7448 tokens/s, avg speed: 10.3273 tokens/s, remaining time: 0:19:13 +pred is: + ['Alberta and British Columbia'] + label is: + ['Alberta and British Columbia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:23,376 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:23,376 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:23,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:23,377 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:23,377 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:24,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,834 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4571990966796875 s; generated tokens: 17 tokens; generate speed: 11.666216400171729 tokens/s +2024-07-30 14:15:24,839 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:24,840 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1226/2067], cost time 1.4691s, every example cost time is 1.4691, generate speed: 11.5718 tokens/s, avg speed: 10.3284 tokens/s, remaining time: 0:19:11 +pred is: + ['The mortar and pestle and the ℞ (recipere) character'] + label is: + ['the mortar and pestle and the ℞ (recipere) character'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:24,923 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:24,923 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:24,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:24,924 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:24,924 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:25,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:25,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:25,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:25,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:25,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,410 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.48549222946167 s; generated tokens: 18 tokens; generate speed: 12.117195662829587 tokens/s +2024-07-30 14:15:26,414 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:26,415 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1227/2067], cost time 1.4969s, every example cost time is 1.4969, generate speed: 12.0248 tokens/s, avg speed: 10.3299 tokens/s, remaining time: 0:19:10 +pred is: + ['A system of many biological structures and processes within an organism that protects against disease.'] + label is: + ['a system of many biological structures and processes within an organism that protects against disease'] +The F1/Em of this example is: {'F1': 98.3050847457627, 'Em': 0.0} +2024-07-30 14:15:26,499 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:26,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:26,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:26,501 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:26,501 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:27,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:27,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:28,057 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5559437274932861 s; generated tokens: 20 tokens; generate speed: 12.853935297660884 tokens/s +2024-07-30 14:15:28,062 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:28,062 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1228/2067], cost time 1.5678s, every example cost time is 1.5678, generate speed: 12.7571 tokens/s, avg speed: 10.3322 tokens/s, remaining time: 0:19:09 +pred is: + ['They evolve and adapt'] + label is: + ['Pathogens can rapidly evolve and adapt'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:15:28,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:28,146 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:28,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:28,147 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:28,147 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:29,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,222 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.074927806854248 s; generated tokens: 5 tokens; generate speed: 4.651475167092744 tokens/s +2024-07-30 14:15:29,227 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:29,227 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1229/2067], cost time 1.0866s, every example cost time is 1.0866, generate speed: 4.6014 tokens/s, avg speed: 10.3285 tokens/s, remaining time: 0:19:07 +pred is: + ['Autoimmune diseases'] + label is: + ['autoimmune diseases, inflammatory diseases and cancer'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:15:29,310 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:29,311 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:29,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:29,311 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:29,311 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:30,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:30,710 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3981256484985352 s; generated tokens: 15 tokens; generate speed: 10.728649471604136 tokens/s +2024-07-30 14:15:30,715 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:30,715 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1230/2067], cost time 1.4097s, every example cost time is 1.4097, generate speed: 10.6403 tokens/s, avg speed: 10.3288 tokens/s, remaining time: 0:19:06 +pred is: + ['The plague of Athens in 430 BC'] + label is: + ['plague of Athens in 430 BC'] +The F1/Em of this example is: {'F1': 91.66666666666666, 'Em': 0.0} +F1 score: 64.74262330259202, Em score: 50.56910569105691, current_count: 1230 +2024-07-30 14:15:31,153 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:31,154 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:31,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:31,154 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:31,155 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:32,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,259 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.104416847229004 s; generated tokens: 6 tokens; generate speed: 5.432731323371313 tokens/s +2024-07-30 14:15:32,264 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:32,264 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1231/2067], cost time 1.1162s, every example cost time is 1.1162, generate speed: 5.3752 tokens/s, avg speed: 10.3255 tokens/s, remaining time: 0:19:04 +pred is: + ['Adaptive immune system'] + label is: + ['immunological memory'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:15:32,348 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:32,348 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 144, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:32,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:32,349 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:32,349 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:33,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:33,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:33,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:33,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:33,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0429179668426514 s; generated tokens: 4 tokens; generate speed: 3.8353927414920963 tokens/s +2024-07-30 14:15:33,397 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:33,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1232/2067], cost time 1.0542s, every example cost time is 1.0542, generate speed: 3.7944 tokens/s, avg speed: 10.3214 tokens/s, remaining time: 0:19:03 +pred is: + ['Self molecules'] + label is: + ['self and non-self'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:15:33,480 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:33,480 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:33,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:33,481 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:33,481 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:34,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,555 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0741608142852783 s; generated tokens: 5 tokens; generate speed: 4.654796501142973 tokens/s +2024-07-30 14:15:34,560 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:34,560 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1233/2067], cost time 1.0857s, every example cost time is 1.0857, generate speed: 4.6052 tokens/s, avg speed: 10.3177 tokens/s, remaining time: 0:19:01 +pred is: + ['Pattern recognition receptors'] + label is: + ['pattern recognition receptors'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:34,643 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:34,643 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:34,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:34,644 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:34,644 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:35,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,904 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2596936225891113 s; generated tokens: 11 tokens; generate speed: 8.73228204282812 tokens/s +2024-07-30 14:15:35,909 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:35,909 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1234/2067], cost time 1.2712s, every example cost time is 1.2712, generate speed: 8.6533 tokens/s, avg speed: 10.3165 tokens/s, remaining time: 0:19:00 +pred is: + ['exoskeleton'] + label is: + ['exoskeleton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:35,992 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:35,992 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:35,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:35,993 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:35,993 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:36,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:36,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:37,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:37,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:37,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:37,072 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.079378604888916 s; generated tokens: 5 tokens; generate speed: 4.632294893889039 tokens/s +2024-07-30 14:15:37,077 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:37,078 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1235/2067], cost time 1.0908s, every example cost time is 1.0908, generate speed: 4.5840 tokens/s, avg speed: 10.3128 tokens/s, remaining time: 0:18:58 +pred is: + ['β-defensins'] + label is: + ['β-defensins'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:37,160 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:37,160 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:37,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:37,161 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:37,161 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:38,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,711 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.550307035446167 s; generated tokens: 20 tokens; generate speed: 12.9006703464028 tokens/s +2024-07-30 14:15:38,716 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:38,716 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1236/2067], cost time 1.5618s, every example cost time is 1.5618, generate speed: 12.8054 tokens/s, avg speed: 10.3151 tokens/s, remaining time: 0:18:57 +pred is: + ['Probiotic flora'] + label is: + ['commensal flora'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:15:38,801 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:38,802 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:38,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:38,802 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:38,802 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:39,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:39,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:40,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:40,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:40,103 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3008368015289307 s; generated tokens: 12 tokens; generate speed: 9.22483126699358 tokens/s +2024-07-30 14:15:40,108 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:40,109 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1237/2067], cost time 1.3126s, every example cost time is 1.3126, generate speed: 9.1419 tokens/s, avg speed: 10.3142 tokens/s, remaining time: 0:18:55 +pred is: + ['Inflammation'] + label is: + ['Inflammation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:40,192 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:40,192 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:40,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:40,193 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:40,193 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:41,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,270 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0765917301177979 s; generated tokens: 5 tokens; generate speed: 4.6442860929768734 tokens/s +2024-07-30 14:15:41,275 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:41,275 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1238/2067], cost time 1.0883s, every example cost time is 1.0883, generate speed: 4.5945 tokens/s, avg speed: 10.3105 tokens/s, remaining time: 0:18:54 +pred is: + ['Phagocytes'] + label is: + ['phagocytes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:41,357 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:41,357 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:41,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:41,358 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:41,358 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:42,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,906 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.547985315322876 s; generated tokens: 20 tokens; generate speed: 12.920019203042916 tokens/s +2024-07-30 14:15:42,911 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:42,912 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1239/2067], cost time 1.5594s, every example cost time is 1.5594, generate speed: 12.8251 tokens/s, avg speed: 10.3128 tokens/s, remaining time: 0:18:53 +pred is: + ['1'] + label is: + ['Neutrophils and macrophages'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:15:42,994 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:42,995 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:42,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:42,995 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:42,996 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:43,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:43,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:44,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:44,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:44,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:44,090 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.094477653503418 s; generated tokens: 5 tokens; generate speed: 4.568389298762769 tokens/s +2024-07-30 14:15:44,095 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:44,095 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1240/2067], cost time 1.1057s, every example cost time is 1.1057, generate speed: 4.5221 tokens/s, avg speed: 10.3090 tokens/s, remaining time: 0:18:51 +pred is: + ['Leukocytes'] + label is: + ['Leukocytes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.8186236523023, Em score: 50.645161290322584, current_count: 1240 +2024-07-30 14:15:44,539 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:44,540 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:44,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:44,540 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:44,540 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:45,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,644 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1037507057189941 s; generated tokens: 6 tokens; generate speed: 5.436010114341482 tokens/s +2024-07-30 14:15:45,649 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:45,649 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1241/2067], cost time 1.1155s, every example cost time is 1.1155, generate speed: 5.3790 tokens/s, avg speed: 10.3058 tokens/s, remaining time: 0:18:50 +pred is: + ['Dendritic cells'] + label is: + ['Dendritic cells'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:45,732 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:45,732 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 269, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:45,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:45,733 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:45,733 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:46,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:46,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:47,305 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5721914768218994 s; generated tokens: 20 tokens; generate speed: 12.72109682239782 tokens/s +2024-07-30 14:15:47,310 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:47,311 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1242/2067], cost time 1.5836s, every example cost time is 1.5836, generate speed: 12.6298 tokens/s, avg speed: 10.3080 tokens/s, remaining time: 0:18:48 +pred is: + ['missing self'] + label is: + ['missing self'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:47,393 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:47,393 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:47,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:47,394 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:47,394 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:48,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,471 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0763847827911377 s; generated tokens: 5 tokens; generate speed: 4.64517901027425 tokens/s +2024-07-30 14:15:48,476 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:48,476 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1243/2067], cost time 1.0878s, every example cost time is 1.0878, generate speed: 4.5965 tokens/s, avg speed: 10.3043 tokens/s, remaining time: 0:18:47 +pred is: + ['Vertebrates'] + label is: + ['vertebrates'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:48,558 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:48,559 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:48,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:48,559 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:48,560 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:49,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,790 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2307078838348389 s; generated tokens: 10 tokens; generate speed: 8.125405005808837 tokens/s +2024-07-30 14:15:49,795 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:49,795 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1244/2067], cost time 1.2420s, every example cost time is 1.2420, generate speed: 8.0514 tokens/s, avg speed: 10.3027 tokens/s, remaining time: 0:18:45 +pred is: + ['Killer T cells and helper T cells'] + label is: + ['killer T cell and the helper T cell'] +The F1/Em of this example is: {'F1': 35.71428571428571, 'Em': 0.0} +2024-07-30 14:15:49,878 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:49,878 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 292, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:49,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:49,879 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:49,879 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:50,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:50,988 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1079976558685303 s; generated tokens: 6 tokens; generate speed: 5.415173911443664 tokens/s +2024-07-30 14:15:50,992 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:50,993 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1245/2067], cost time 1.1193s, every example cost time is 1.1193, generate speed: 5.3603 tokens/s, avg speed: 10.2994 tokens/s, remaining time: 0:18:44 +pred is: + ['Killer T cells'] + label is: + ['Killer T cells'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:51,075 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:51,075 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:51,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:51,076 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:51,076 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:52,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:52,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:52,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:52,090 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.013381004333496 s; generated tokens: 3 tokens; generate speed: 2.960387048080805 tokens/s +2024-07-30 14:15:52,095 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:52,095 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1246/2067], cost time 1.0248s, every example cost time is 1.0248, generate speed: 2.9273 tokens/s, avg speed: 10.2950 tokens/s, remaining time: 0:18:42 +pred is: + ['CD4'] + label is: + ['CD4 co-receptor'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:15:52,178 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:52,178 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:52,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:52,179 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:52,179 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:53,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,737 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5578553676605225 s; generated tokens: 20 tokens; generate speed: 12.838162267935433 tokens/s +2024-07-30 14:15:53,742 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:53,743 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1247/2067], cost time 1.5699s, every example cost time is 1.5699, generate speed: 12.7397 tokens/s, avg speed: 10.2972 tokens/s, remaining time: 0:18:41 +pred is: + ['Cytotoxic T cells'] + label is: + ['helper T cells, cytotoxic T cells and NK cells'] +The F1/Em of this example is: {'F1': 43.47826086956522, 'Em': 0.0} +2024-07-30 14:15:53,826 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:53,826 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:53,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:53,827 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:53,827 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:54,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:54,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:54,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:54,841 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.013794183731079 s; generated tokens: 3 tokens; generate speed: 2.9591805202107824 tokens/s +2024-07-30 14:15:54,846 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:54,846 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1248/2067], cost time 1.0256s, every example cost time is 1.0256, generate speed: 2.9251 tokens/s, avg speed: 10.2928 tokens/s, remaining time: 0:18:39 +pred is: + ['B cell'] + label is: + ['B cell'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:54,928 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:54,928 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:54,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:54,929 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:54,929 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:55,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:55,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:55,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:55,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:55,973 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0437180995941162 s; generated tokens: 4 tokens; generate speed: 3.8324524615943045 tokens/s +2024-07-30 14:15:55,978 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:55,978 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1249/2067], cost time 1.0551s, every example cost time is 1.0551, generate speed: 3.7910 tokens/s, avg speed: 10.2888 tokens/s, remaining time: 0:18:38 +pred is: + ['Memory cells'] + label is: + ['long-lived memory cells'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:15:56,062 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:56,063 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:56,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:56,063 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:56,063 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:57,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:57,627 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5632429122924805 s; generated tokens: 20 tokens; generate speed: 12.79391695476821 tokens/s +2024-07-30 14:15:57,632 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:57,632 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1250/2067], cost time 1.5750s, every example cost time is 1.5750, generate speed: 12.6986 tokens/s, avg speed: 10.2910 tokens/s, remaining time: 0:18:37 +pred is: + ['1'] + label is: + ['microbes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.86342870035095, Em score: 50.64, current_count: 1250 +2024-07-30 14:15:58,075 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:58,075 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:58,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:58,076 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:58,076 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:15:59,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,365 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.288560152053833 s; generated tokens: 12 tokens; generate speed: 9.312720078199863 tokens/s +2024-07-30 14:15:59,370 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:15:59,370 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1251/2067], cost time 1.3003s, every example cost time is 1.3003, generate speed: 9.2283 tokens/s, avg speed: 10.2902 tokens/s, remaining time: 0:18:35 +pred is: + ['immunomodulators'] + label is: + ['immunomodulators'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:15:59,483 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:15:59,483 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:15:59,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:15:59,484 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:15:59,484 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:00,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,560 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0751631259918213 s; generated tokens: 5 tokens; generate speed: 4.650457106578667 tokens/s +2024-07-30 14:16:00,565 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:00,565 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1252/2067], cost time 1.0868s, every example cost time is 1.0868, generate speed: 4.6005 tokens/s, avg speed: 10.2866 tokens/s, remaining time: 0:18:34 +pred is: + ['NFIL3'] + label is: + ['NFIL3'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:00,647 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:00,648 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:00,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:00,648 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:00,649 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:01,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:01,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:02,190 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5413103103637695 s; generated tokens: 20 tokens; generate speed: 12.975972369431394 tokens/s +2024-07-30 14:16:02,195 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:02,195 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1253/2067], cost time 1.5531s, every example cost time is 1.5531, generate speed: 12.8775 tokens/s, avg speed: 10.2889 tokens/s, remaining time: 0:18:32 +pred is: + ['1'] + label is: + ['decline in hormone levels with age'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:02,279 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:02,279 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:02,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:02,280 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:02,280 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:03,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,355 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0743732452392578 s; generated tokens: 5 tokens; generate speed: 4.6538761293208895 tokens/s +2024-07-30 14:16:03,359 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:03,360 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1254/2067], cost time 1.0859s, every example cost time is 1.0859, generate speed: 4.6043 tokens/s, avg speed: 10.2853 tokens/s, remaining time: 0:18:31 +pred is: + ['Helper T cells'] + label is: + ['killer T cells'] +The F1/Em of this example is: {'F1': 80.00000000000001, 'Em': 0.0} +2024-07-30 14:16:03,442 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:03,442 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:03,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:03,443 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:03,443 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:04,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,550 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.106691598892212 s; generated tokens: 6 tokens; generate speed: 5.421564603911284 tokens/s +2024-07-30 14:16:04,555 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:04,555 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1255/2067], cost time 1.1185s, every example cost time is 1.1185, generate speed: 5.3645 tokens/s, avg speed: 10.2821 tokens/s, remaining time: 0:18:29 +pred is: + ['phagocytic cells'] + label is: + ['phagocytic cells'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:04,638 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:04,638 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:04,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:04,639 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:04,639 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:05,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:05,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:06,208 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5686650276184082 s; generated tokens: 20 tokens; generate speed: 12.749694579705501 tokens/s +2024-07-30 14:16:06,213 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:06,213 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1256/2067], cost time 1.5805s, every example cost time is 1.5805, generate speed: 12.6539 tokens/s, avg speed: 10.2843 tokens/s, remaining time: 0:18:28 +pred is: + ['Autoimmune disorders'] + label is: + ['autoimmune disorders'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:06,296 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:06,297 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:06,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:06,297 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:06,297 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:07,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,404 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1061322689056396 s; generated tokens: 6 tokens; generate speed: 5.424306087676246 tokens/s +2024-07-30 14:16:07,408 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:07,409 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1257/2067], cost time 1.1175s, every example cost time is 1.1175, generate speed: 5.3690 tokens/s, avg speed: 10.2811 tokens/s, remaining time: 0:18:27 +pred is: + ['Immunodeficiencies'] + label is: + ['Immunodeficiencies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:07,492 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:07,492 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:07,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:07,493 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:07,493 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:08,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,633 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1390836238861084 s; generated tokens: 7 tokens; generate speed: 6.145290699657971 tokens/s +2024-07-30 14:16:08,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:08,638 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1258/2067], cost time 1.1508s, every example cost time is 1.1508, generate speed: 6.0828 tokens/s, avg speed: 10.2783 tokens/s, remaining time: 0:18:25 +pred is: + ['1'] + label is: + ['vaccination'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:08,719 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:08,720 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:08,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:08,720 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:08,721 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:09,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:09,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:10,283 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5620200634002686 s; generated tokens: 20 tokens; generate speed: 12.80393284863652 tokens/s +2024-07-30 14:16:10,288 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:10,288 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1259/2067], cost time 1.5734s, every example cost time is 1.5734, generate speed: 12.7111 tokens/s, avg speed: 10.2805 tokens/s, remaining time: 0:18:24 +pred is: + ['1'] + label is: + ['enzymes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:10,371 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:10,371 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:10,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:10,372 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:10,372 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:11,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:11,697 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.324951171875 s; generated tokens: 12 tokens; generate speed: 9.056937534549474 tokens/s +2024-07-30 14:16:11,702 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:11,702 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1260/2067], cost time 1.3365s, every example cost time is 1.3365, generate speed: 8.9784 tokens/s, avg speed: 10.2795 tokens/s, remaining time: 0:18:22 +pred is: + ['Frank Burnet'] + label is: + ['Frank Burnet'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.88832212336405, Em score: 50.714285714285715, current_count: 1260 +2024-07-30 14:16:12,148 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:12,148 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:12,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:12,149 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:12,149 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:13,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,254 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1052379608154297 s; generated tokens: 6 tokens; generate speed: 5.428695188476227 tokens/s +2024-07-30 14:16:13,259 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:13,259 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1261/2067], cost time 1.1171s, every example cost time is 1.1171, generate speed: 5.3712 tokens/s, avg speed: 10.2763 tokens/s, remaining time: 0:18:21 +pred is: + ['Glucocorticoids'] + label is: + ['Glucocorticoids'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:13,342 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:13,342 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:13,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:13,343 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:13,343 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:14,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,846 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5024752616882324 s; generated tokens: 19 tokens; generate speed: 12.64579889232316 tokens/s +2024-07-30 14:16:14,851 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:14,851 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1262/2067], cost time 1.5141s, every example cost time is 1.5141, generate speed: 12.5486 tokens/s, avg speed: 10.2783 tokens/s, remaining time: 0:18:20 +pred is: + ['Cytotoxic natural killer cells and CTLs (cytotoxic T lymphocytes)'] + label is: + ['cytotoxic natural killer cells and CTLs (cytotoxic T lymphocytes)'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:14,934 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:14,935 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:14,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:14,935 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:14,936 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:15,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:15,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:15,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:15,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:16,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:16,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:16,041 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1056644916534424 s; generated tokens: 6 tokens; generate speed: 5.426600967376123 tokens/s +2024-07-30 14:16:16,046 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:16,047 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1263/2067], cost time 1.1171s, every example cost time is 1.1171, generate speed: 5.3712 tokens/s, avg speed: 10.2751 tokens/s, remaining time: 0:18:18 +pred is: + ['A vitamin D receptor'] + label is: + ['a vitamin D receptor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:16,158 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:16,159 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:16,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:16,159 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:16,160 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:17,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:17,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:17,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:17,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:17,203 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0431125164031982 s; generated tokens: 4 tokens; generate speed: 3.8346774073736305 tokens/s +2024-07-30 14:16:17,208 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:17,208 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1264/2067], cost time 1.0550s, every example cost time is 1.0550, generate speed: 3.7913 tokens/s, avg speed: 10.2712 tokens/s, remaining time: 0:18:17 +pred is: + ['Pattern recognition receptors'] + label is: + ['Pattern recognition receptors'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:17,291 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:17,292 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:17,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:17,293 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:17,293 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:18,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,856 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5627105236053467 s; generated tokens: 20 tokens; generate speed: 12.798275622959126 tokens/s +2024-07-30 14:16:18,861 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:18,861 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1265/2067], cost time 1.5747s, every example cost time is 1.5747, generate speed: 12.7011 tokens/s, avg speed: 10.2734 tokens/s, remaining time: 0:18:15 +pred is: + ['Immunoglobulins and T cell receptors'] + label is: + ['immunoglobulins and T cell receptors'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:18,946 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:18,947 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:18,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:18,947 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:18,948 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:19,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:19,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:19,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:19,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,489 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5409083366394043 s; generated tokens: 20 tokens; generate speed: 12.979357385799062 tokens/s +2024-07-30 14:16:20,494 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:20,494 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1266/2067], cost time 1.5529s, every example cost time is 1.5529, generate speed: 12.8795 tokens/s, avg speed: 10.2757 tokens/s, remaining time: 0:18:14 +pred is: + ['1'] + label is: + ['lymphocytes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:20,576 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:20,576 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:20,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:20,577 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:20,577 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:21,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:21,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:22,131 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.553243637084961 s; generated tokens: 20 tokens; generate speed: 12.876280013311279 tokens/s +2024-07-30 14:16:22,136 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:22,136 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1267/2067], cost time 1.5644s, every example cost time is 1.5644, generate speed: 12.7841 tokens/s, avg speed: 10.2780 tokens/s, remaining time: 0:18:13 +pred is: + ['1'] + label is: + ['"cellular" and "humoral" theories of immunity'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:22,218 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:22,219 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:22,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:22,219 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:22,219 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:23,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,751 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5312142372131348 s; generated tokens: 20 tokens; generate speed: 13.06152954559822 tokens/s +2024-07-30 14:16:23,756 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:23,756 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1268/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9662 tokens/s, avg speed: 10.2804 tokens/s, remaining time: 0:18:12 +pred is: + ['1'] + label is: + ['cancers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:23,838 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:23,838 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 304, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:23,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:23,839 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:23,839 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:24,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:24,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:25,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:25,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:25,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:25,327 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.487614631652832 s; generated tokens: 18 tokens; generate speed: 12.099907877351868 tokens/s +2024-07-30 14:16:25,332 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:25,332 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1269/2067], cost time 1.4991s, every example cost time is 1.4991, generate speed: 12.0074 tokens/s, avg speed: 10.2819 tokens/s, remaining time: 0:18:10 +pred is: + ['Type I hypersensitivity'] + label is: + ['Hypersensitivity'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:16:25,415 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:25,415 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 310, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:25,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:25,416 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:25,416 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:26,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:26,953 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5370533466339111 s; generated tokens: 20 tokens; generate speed: 13.011910122572678 tokens/s +2024-07-30 14:16:26,958 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:26,959 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1270/2067], cost time 1.5487s, every example cost time is 1.5487, generate speed: 12.9142 tokens/s, avg speed: 10.2842 tokens/s, remaining time: 0:18:09 +pred is: + ['Intracellular pathogenesis'] + label is: + ['intracellular pathogenesis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.87607811714332, Em score: 50.78740157480315, current_count: 1270 +2024-07-30 14:16:27,422 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:27,422 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:27,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:27,423 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:27,423 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:28,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,684 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2608089447021484 s; generated tokens: 11 tokens; generate speed: 8.724557393268354 tokens/s +2024-07-30 14:16:28,689 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:28,690 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1271/2067], cost time 1.2727s, every example cost time is 1.2727, generate speed: 8.6429 tokens/s, avg speed: 10.2830 tokens/s, remaining time: 0:18:08 +pred is: + ['antigenic variation'] + label is: + ['antigenic variation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:28,772 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:28,773 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:28,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:28,773 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:28,774 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:29,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:29,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:30,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:30,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5477113723754883 s; generated tokens: 20 tokens; generate speed: 12.922306030034019 tokens/s +2024-07-30 14:16:30,326 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:30,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1272/2067], cost time 1.5593s, every example cost time is 1.5593, generate speed: 12.8266 tokens/s, avg speed: 10.2853 tokens/s, remaining time: 0:18:06 +pred is: + ['Immune surveillance'] + label is: + ['immune surveillance'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:30,411 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:30,411 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 310, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:30,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:30,412 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:30,412 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:31,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,611 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1989965438842773 s; generated tokens: 9 tokens; generate speed: 7.506276849509122 tokens/s +2024-07-30 14:16:31,616 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:31,616 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1273/2067], cost time 1.2107s, every example cost time is 1.2107, generate speed: 7.4338 tokens/s, avg speed: 10.2833 tokens/s, remaining time: 0:18:05 +pred is: + ['500 Da'] + label is: + ['>500 Da'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:16:31,699 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:31,699 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 343, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:31,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:31,700 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:31,700 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:32,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,807 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.106548547744751 s; generated tokens: 6 tokens; generate speed: 5.42226548688583 tokens/s +2024-07-30 14:16:32,811 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:32,812 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1274/2067], cost time 1.1179s, every example cost time is 1.1179, generate speed: 5.3673 tokens/s, avg speed: 10.2802 tokens/s, remaining time: 0:18:03 +pred is: + ['Prolactin'] + label is: + ['leptin, pituitary growth hormone, and prolactin'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:16:32,895 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:32,895 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:32,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:32,896 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:32,896 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:33,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:33,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:33,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:33,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:33,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,441 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5450294017791748 s; generated tokens: 20 tokens; generate speed: 12.944737476820213 tokens/s +2024-07-30 14:16:34,446 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:34,446 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1275/2067], cost time 1.5565s, every example cost time is 1.5565, generate speed: 12.8494 tokens/s, avg speed: 10.2825 tokens/s, remaining time: 0:18:02 +pred is: + ['1'] + label is: + ['carbohydrates'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:34,529 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:34,530 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:34,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:34,530 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:34,531 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:35,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,604 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0731744766235352 s; generated tokens: 5 tokens; generate speed: 4.65907465087243 tokens/s +2024-07-30 14:16:35,609 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:35,609 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1276/2067], cost time 1.0848s, every example cost time is 1.0848, generate speed: 4.6092 tokens/s, avg speed: 10.2789 tokens/s, remaining time: 0:18:01 +pred is: + ['Civil disobedience'] + label is: + ['Civil disobedience'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:35,691 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:35,692 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:35,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:35,692 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:35,692 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:36,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,765 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0724022388458252 s; generated tokens: 5 tokens; generate speed: 4.662429654549452 tokens/s +2024-07-30 14:16:36,770 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:36,770 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1277/2067], cost time 1.0837s, every example cost time is 1.0837, generate speed: 4.6136 tokens/s, avg speed: 10.2754 tokens/s, remaining time: 0:17:59 +pred is: + ['Antigone'] + label is: + ['Antigone'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:36,853 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:36,853 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:36,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:36,854 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:36,854 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:37,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:37,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:38,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:38,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:38,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:38,393 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5388576984405518 s; generated tokens: 20 tokens; generate speed: 12.996653309963364 tokens/s +2024-07-30 14:16:38,398 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:38,398 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1278/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9011 tokens/s, avg speed: 10.2778 tokens/s, remaining time: 0:17:58 +pred is: + ['Percy Shelley'] + label is: + ['Percy Shelley'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:38,481 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:38,482 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:38,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:38,482 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:38,482 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:39,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:39,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:40,031 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5482580661773682 s; generated tokens: 20 tokens; generate speed: 12.917743131401716 tokens/s +2024-07-30 14:16:40,036 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:40,036 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1279/2067], cost time 1.5597s, every example cost time is 1.5597, generate speed: 12.8227 tokens/s, avg speed: 10.2800 tokens/s, remaining time: 0:17:57 +pred is: + ['muggers, arsonists, draft evaders, campaign hecklers, campus militants, anti'] + label is: + ['muggers, arsonists, draft evaders, campaign hecklers, campus militants, anti-war demonstrators, juvenile delinquents and political assassins'] +The F1/Em of this example is: {'F1': 73.68421052631578, 'Em': 0.0} +2024-07-30 14:16:40,121 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:40,121 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:40,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:40,122 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:40,122 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:41,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:41,667 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5450403690338135 s; generated tokens: 20 tokens; generate speed: 12.944645590397707 tokens/s +2024-07-30 14:16:41,672 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:41,672 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1280/2067], cost time 1.5565s, every example cost time is 1.5565, generate speed: 12.8491 tokens/s, avg speed: 10.2823 tokens/s, remaining time: 0:17:55 +pred is: + ['LeGrande'] + label is: + ['LeGrande'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.97367454632683, Em score: 50.859375, current_count: 1280 +2024-07-30 14:16:42,137 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:42,138 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:42,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:42,138 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:42,139 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:43,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,678 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539567232131958 s; generated tokens: 20 tokens; generate speed: 12.990663598564936 tokens/s +2024-07-30 14:16:43,683 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:43,683 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1281/2067], cost time 1.5514s, every example cost time is 1.5514, generate speed: 12.8912 tokens/s, avg speed: 10.2846 tokens/s, remaining time: 0:17:54 +pred is: + ['Constitutional impasse'] + label is: + ['constitutional impasse'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:43,767 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:43,768 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:43,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:43,768 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:43,768 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:44,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:44,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:45,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:45,132 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3630707263946533 s; generated tokens: 14 tokens; generate speed: 10.270927053822257 tokens/s +2024-07-30 14:16:45,137 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:45,137 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1282/2067], cost time 1.3747s, every example cost time is 1.3747, generate speed: 10.1843 tokens/s, avg speed: 10.2845 tokens/s, remaining time: 0:17:53 +pred is: + ['1'] + label is: + ['Thoreau'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:45,218 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:45,219 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 138, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:45,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:45,219 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:45,220 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:46,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,765 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5454258918762207 s; generated tokens: 20 tokens; generate speed: 12.941416411575094 tokens/s +2024-07-30 14:16:46,770 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:46,770 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1283/2067], cost time 1.5569s, every example cost time is 1.5569, generate speed: 12.8462 tokens/s, avg speed: 10.2868 tokens/s, remaining time: 0:17:51 +pred is: + ['1'] + label is: + ['governmental entities'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:46,854 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:46,854 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 282, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:46,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:46,855 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:46,855 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:47,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:47,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:48,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:48,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:48,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:48,178 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3224008083343506 s; generated tokens: 13 tokens; generate speed: 9.830605001198041 tokens/s +2024-07-30 14:16:48,183 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:48,183 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1284/2067], cost time 1.3339s, every example cost time is 1.3339, generate speed: 9.7455 tokens/s, avg speed: 10.2864 tokens/s, remaining time: 0:17:50 +pred is: + ['Civil disobedience'] + label is: + ['civil disobedience'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:48,265 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:48,265 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:48,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:48,266 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:48,266 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:49,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,803 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5369925498962402 s; generated tokens: 20 tokens; generate speed: 13.01242481712105 tokens/s +2024-07-30 14:16:49,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:49,808 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1285/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9168 tokens/s, avg speed: 10.2887 tokens/s, remaining time: 0:17:49 +pred is: + ['1'] + label is: + ['non-violence'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:49,891 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:49,891 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:49,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:49,892 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:49,892 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:50,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:50,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:50,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:50,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:50,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:50,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:51,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:51,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:51,059 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1662428379058838 s; generated tokens: 8 tokens; generate speed: 6.859634837599408 tokens/s +2024-07-30 14:16:51,063 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:51,064 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1286/2067], cost time 1.1778s, every example cost time is 1.1778, generate speed: 6.7922 tokens/s, avg speed: 10.2864 tokens/s, remaining time: 0:17:47 +pred is: + ['Revolutionary civil disobedience'] + label is: + ['Revolutionary civil disobedience'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:16:51,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:51,146 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:51,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:51,147 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:51,147 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:52,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,681 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342953205108643 s; generated tokens: 20 tokens; generate speed: 13.035300135922158 tokens/s +2024-07-30 14:16:52,686 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:52,686 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1287/2067], cost time 1.5455s, every example cost time is 1.5455, generate speed: 12.9409 tokens/s, avg speed: 10.2887 tokens/s, remaining time: 0:17:46 +pred is: + ['Roman Empire'] + label is: + ['during the Roman Empire'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:16:52,769 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:52,769 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 295, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:52,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:52,770 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:52,770 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:53,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:53,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:54,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:54,098 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.327409267425537 s; generated tokens: 13 tokens; generate speed: 9.793513062638953 tokens/s +2024-07-30 14:16:54,102 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:54,103 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1288/2067], cost time 1.3386s, every example cost time is 1.3386, generate speed: 9.7117 tokens/s, avg speed: 10.2883 tokens/s, remaining time: 0:17:45 +pred is: + ['1'] + label is: + ['illegal'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:54,185 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:54,185 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:54,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:54,186 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:54,186 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:55,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,718 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531677484512329 s; generated tokens: 20 tokens; generate speed: 13.057579158949249 tokens/s +2024-07-30 14:16:55,723 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:55,723 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1289/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9611 tokens/s, avg speed: 10.2906 tokens/s, remaining time: 0:17:43 +pred is: + ['Threatening government officials'] + label is: + ['sending an email to the Lebanon, New Hampshire city councilors'] +The F1/Em of this example is: {'F1': 8.000000000000002, 'Em': 0.0} +2024-07-30 14:16:55,806 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:55,807 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:55,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:55,807 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:55,807 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:56,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:56,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:57,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:57,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:57,341 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5330698490142822 s; generated tokens: 20 tokens; generate speed: 13.045720006077609 tokens/s +2024-07-30 14:16:57,346 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:57,346 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1290/2067], cost time 1.5445s, every example cost time is 1.5445, generate speed: 12.9494 tokens/s, avg speed: 10.2929 tokens/s, remaining time: 0:17:42 +pred is: + ['It to be more difficult for a system to function'] + label is: + ['system to function'] +The F1/Em of this example is: {'F1': 41.66666666666667, 'Em': 0.0} +F1 score: 64.7875737100504, Em score: 50.69767441860465, current_count: 1290 +2024-07-30 14:16:57,805 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:57,806 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 354, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:57,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:57,807 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:57,807 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:58,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:58,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:58,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:58,819 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0124895572662354 s; generated tokens: 3 tokens; generate speed: 2.9629935227185227 tokens/s +2024-07-30 14:16:58,824 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:16:58,824 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1291/2067], cost time 1.0241s, every example cost time is 1.0241, generate speed: 2.9294 tokens/s, avg speed: 10.2887 tokens/s, remaining time: 0:17:41 +pred is: + ['Federal'] + label is: + ['criminal investigations'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:16:58,906 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:16:58,907 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:16:58,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:58,907 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:16:58,908 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:16:59,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:59,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:59,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:59,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:16:59,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:00,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:00,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:00,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:00,073 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1657140254974365 s; generated tokens: 8 tokens; generate speed: 6.862746629977467 tokens/s +2024-07-30 14:17:00,078 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:00,079 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1292/2067], cost time 1.1768s, every example cost time is 1.1768, generate speed: 6.7980 tokens/s, avg speed: 10.2863 tokens/s, remaining time: 0:17:39 +pred is: + ['The validity of the social contract'] + label is: + ['accept punishment'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:17:00,161 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:00,161 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 314, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:00,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:00,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:00,162 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:01,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,328 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.166163682937622 s; generated tokens: 8 tokens; generate speed: 6.860100444774285 tokens/s +2024-07-30 14:17:01,333 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:01,333 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1293/2067], cost time 1.1772s, every example cost time is 1.1772, generate speed: 6.7957 tokens/s, avg speed: 10.2840 tokens/s, remaining time: 0:17:38 +pred is: + ['Whether or not to plead guilty'] + label is: + ['whether or not to plead guilty'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:01,416 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:01,416 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:01,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:01,417 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:01,417 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:02,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,673 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.255713701248169 s; generated tokens: 11 tokens; generate speed: 8.75995857102307 tokens/s +2024-07-30 14:17:02,678 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:02,678 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1294/2067], cost time 1.2668s, every example cost time is 1.2668, generate speed: 8.6832 tokens/s, avg speed: 10.2829 tokens/s, remaining time: 0:17:36 +pred is: + ['1'] + label is: + ['Camp Mercury nuclear test site'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:02,760 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:02,761 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:02,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:02,761 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:02,761 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:03,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:03,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:04,083 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.320969820022583 s; generated tokens: 13 tokens; generate speed: 9.84125435945066 tokens/s +2024-07-30 14:17:04,087 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:04,088 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1295/2067], cost time 1.3322s, every example cost time is 1.3322, generate speed: 9.7583 tokens/s, avg speed: 10.2825 tokens/s, remaining time: 0:17:35 +pred is: + ['To continue their protest'] + label is: + ['a way of continuing their protest'] +The F1/Em of this example is: {'F1': 44.44444444444444, 'Em': 0.0} +2024-07-30 14:17:04,170 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:04,170 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:04,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:04,171 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:04,171 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:05,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,244 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0726940631866455 s; generated tokens: 5 tokens; generate speed: 4.66116124959854 tokens/s +2024-07-30 14:17:05,249 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:05,249 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1296/2067], cost time 1.0840s, every example cost time is 1.0840, generate speed: 4.6127 tokens/s, avg speed: 10.2790 tokens/s, remaining time: 0:17:33 +pred is: + ['Plea bargain'] + label is: + ['plea bargain'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:05,331 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:05,331 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:05,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:05,332 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:05,332 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:06,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,866 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5329868793487549 s; generated tokens: 20 tokens; generate speed: 13.046426078021243 tokens/s +2024-07-30 14:17:06,870 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:06,871 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1297/2067], cost time 1.5444s, every example cost time is 1.5444, generate speed: 12.9500 tokens/s, avg speed: 10.2813 tokens/s, remaining time: 0:17:32 +pred is: + ['1'] + label is: + ['defiant speech'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:06,954 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:06,954 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:06,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:06,955 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:06,955 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:07,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:07,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:07,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:07,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,488 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5333707332611084 s; generated tokens: 20 tokens; generate speed: 13.043160121795752 tokens/s +2024-07-30 14:17:08,493 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:08,493 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1298/2067], cost time 1.5446s, every example cost time is 1.5446, generate speed: 12.9480 tokens/s, avg speed: 10.2837 tokens/s, remaining time: 0:17:31 +pred is: + ['1'] + label is: + ['acquittal and avoid imprisonment'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:08,576 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:08,576 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:08,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:08,577 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:08,577 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:09,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:09,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:10,124 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5470349788665771 s; generated tokens: 20 tokens; generate speed: 12.92795591128317 tokens/s +2024-07-30 14:17:10,129 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:10,130 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1299/2067], cost time 1.5584s, every example cost time is 1.5584, generate speed: 12.8340 tokens/s, avg speed: 10.2859 tokens/s, remaining time: 0:17:29 +pred is: + ['1'] + label is: + ['general disobedience'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:10,212 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:10,212 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 332, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:10,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:10,213 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:10,213 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:11,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:11,595 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.381514310836792 s; generated tokens: 15 tokens; generate speed: 10.857650827311666 tokens/s +2024-07-30 14:17:11,600 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:11,600 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1300/2067], cost time 1.3928s, every example cost time is 1.3928, generate speed: 10.7700 tokens/s, avg speed: 10.2863 tokens/s, remaining time: 0:17:28 +pred is: + ['Indirect civil disobedience'] + label is: + ['Indirect civil disobedience'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.5651540343809, Em score: 50.53846153846154, current_count: 1300 +2024-07-30 14:17:12,060 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:12,060 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:12,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:12,061 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:12,061 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:13,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,591 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5293998718261719 s; generated tokens: 20 tokens; generate speed: 13.077024765353945 tokens/s +2024-07-30 14:17:13,596 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:13,596 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1301/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9766 tokens/s, avg speed: 10.2886 tokens/s, remaining time: 0:17:27 +pred is: + ['1'] + label is: + ['incapacitation'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:13,678 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:13,678 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 133, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:13,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:13,679 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:13,679 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:14,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:14,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:14,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:14,689 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0095627307891846 s; generated tokens: 3 tokens; generate speed: 2.971583546526992 tokens/s +2024-07-30 14:17:14,694 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:14,694 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1302/2067], cost time 1.0208s, every example cost time is 1.0208, generate speed: 2.9390 tokens/s, avg speed: 10.2844 tokens/s, remaining time: 0:17:25 +pred is: + ['Construction'] + label is: + ['Construction'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:14,779 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:14,780 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:14,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:14,780 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:14,781 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:15,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:15,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:16,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:16,312 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308895111083984 s; generated tokens: 20 tokens; generate speed: 13.064300104531744 tokens/s +2024-07-30 14:17:16,316 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:16,317 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1303/2067], cost time 1.5430s, every example cost time is 1.5430, generate speed: 12.9617 tokens/s, avg speed: 10.2867 tokens/s, remaining time: 0:17:24 +pred is: + ['Architect'] + label is: + ['An architect'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:17:16,399 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:16,399 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:16,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:16,400 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:16,400 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:17,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:17,930 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5298244953155518 s; generated tokens: 20 tokens; generate speed: 13.073395060179545 tokens/s +2024-07-30 14:17:17,935 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:17,935 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1304/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9767 tokens/s, avg speed: 10.2890 tokens/s, remaining time: 0:17:23 +pred is: + ['buildings, infrastructure and industrial'] + label is: + ['buildings, infrastructure and industrial'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:18,018 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:18,018 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:18,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:18,019 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:18,019 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:18,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:18,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,493 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4740321636199951 s; generated tokens: 18 tokens; generate speed: 12.211402467497576 tokens/s +2024-07-30 14:17:19,498 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:19,499 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1305/2067], cost time 1.4853s, every example cost time is 1.4853, generate speed: 12.1188 tokens/s, avg speed: 10.2906 tokens/s, remaining time: 0:17:21 +pred is: + ['A trade magazine for the construction industry.'] + label is: + ['a trade magazine for the construction industry'] +The F1/Em of this example is: {'F1': 96.2962962962963, 'Em': 0.0} +2024-07-30 14:17:19,581 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:19,582 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:19,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:19,582 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:19,582 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:20,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:20,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:21,120 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5369200706481934 s; generated tokens: 20 tokens; generate speed: 13.013038466967924 tokens/s +2024-07-30 14:17:21,124 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:21,125 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1306/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9154 tokens/s, avg speed: 10.2928 tokens/s, remaining time: 0:17:20 +pred is: + ['building construction, heavy and civil engineering construction, and specialty trade contractors'] + label is: + ['building construction, heavy and civil engineering construction, and specialty trade contractors'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:21,208 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:21,209 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:21,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:21,210 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:21,210 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:22,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,752 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5422720909118652 s; generated tokens: 20 tokens; generate speed: 12.967880387548893 tokens/s +2024-07-30 14:17:22,757 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:22,758 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1307/2067], cost time 1.5541s, every example cost time is 1.5541, generate speed: 12.8689 tokens/s, avg speed: 10.2951 tokens/s, remaining time: 0:17:19 +pred is: + ['Building construction'] + label is: + ['Building construction'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:22,840 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:22,840 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:22,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:22,841 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:22,841 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:23,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:23,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:24,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:24,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:24,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:24,373 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318975448608398 s; generated tokens: 20 tokens; generate speed: 13.055703409862723 tokens/s +2024-07-30 14:17:24,378 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:24,378 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1308/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9606 tokens/s, avg speed: 10.2974 tokens/s, remaining time: 0:17:18 +pred is: + ['1'] + label is: + ['local building authority regulations and codes of practice'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:24,461 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:24,461 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:24,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:24,462 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:24,462 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:25,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:25,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:26,001 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.539318323135376 s; generated tokens: 20 tokens; generate speed: 12.992764199196174 tokens/s +2024-07-30 14:17:26,006 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:26,007 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1309/2067], cost time 1.5507s, every example cost time is 1.5507, generate speed: 12.8971 tokens/s, avg speed: 10.2996 tokens/s, remaining time: 0:17:16 +pred is: + ['3D printing technology'] + label is: + ['3D printing technology'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:26,090 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:26,090 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:26,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:26,091 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:26,091 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:27,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:27,634 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5430095195770264 s; generated tokens: 20 tokens; generate speed: 12.961682832314898 tokens/s +2024-07-30 14:17:27,646 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:27,646 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1310/2067], cost time 1.5612s, every example cost time is 1.5612, generate speed: 12.8108 tokens/s, avg speed: 10.3018 tokens/s, remaining time: 0:17:15 +pred is: + ['1'] + label is: + ['plan the physical proceedings, and to integrate those proceedings with the other parts'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.56564621449729, Em score: 50.534351145038165, current_count: 1310 +2024-07-30 14:17:28,112 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:28,112 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:28,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:28,113 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:28,113 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:29,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,665 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5516963005065918 s; generated tokens: 20 tokens; generate speed: 12.889120115495846 tokens/s +2024-07-30 14:17:29,680 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:29,680 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1311/2067], cost time 1.5733s, every example cost time is 1.5733, generate speed: 12.7123 tokens/s, avg speed: 10.3039 tokens/s, remaining time: 0:17:14 +pred is: + ['previously separated specialties'] + label is: + ['previously separated specialties'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:29,763 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:29,763 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 130, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:29,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:29,764 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:29,764 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:30,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:30,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:31,308 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.543748378753662 s; generated tokens: 20 tokens; generate speed: 12.95547919288952 tokens/s +2024-07-30 14:17:31,314 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:31,314 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1312/2067], cost time 1.5565s, every example cost time is 1.5565, generate speed: 12.8495 tokens/s, avg speed: 10.3061 tokens/s, remaining time: 0:17:13 +pred is: + ['Design-build, partnering and construction management'] + label is: + ['design-build, partnering and construction management'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:31,398 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:31,398 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:31,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:31,398 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:31,399 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:32,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:32,949 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5497221946716309 s; generated tokens: 20 tokens; generate speed: 12.905538856425672 tokens/s +2024-07-30 14:17:32,953 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:32,954 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1313/2067], cost time 1.5611s, every example cost time is 1.5611, generate speed: 12.8113 tokens/s, avg speed: 10.3083 tokens/s, remaining time: 0:17:11 +pred is: + ['1'] + label is: + ['preventable financial problems'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:33,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:33,037 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:33,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:33,038 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:33,038 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:33,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,584 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.54548978805542 s; generated tokens: 20 tokens; generate speed: 12.940881366265499 tokens/s +2024-07-30 14:17:34,589 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:34,589 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1314/2067], cost time 1.5570s, every example cost time is 1.5570, generate speed: 12.8449 tokens/s, avg speed: 10.3105 tokens/s, remaining time: 0:17:10 +pred is: + ['1'] + label is: + ['Mortgage bankers, accountants, and cost engineers'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:34,676 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:34,676 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:34,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:34,677 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:34,677 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:35,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:35,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:36,239 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.561730146408081 s; generated tokens: 20 tokens; generate speed: 12.806309749478311 tokens/s +2024-07-30 14:17:36,244 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:36,244 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1315/2067], cost time 1.5737s, every example cost time is 1.5737, generate speed: 12.7085 tokens/s, avg speed: 10.3126 tokens/s, remaining time: 0:17:09 +pred is: + ['1'] + label is: + ['zoning and building code requirements'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:36,327 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:36,328 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:36,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:36,328 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:36,328 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:37,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,873 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5438613891601562 s; generated tokens: 20 tokens; generate speed: 12.954530853886942 tokens/s +2024-07-30 14:17:37,877 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:37,878 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1316/2067], cost time 1.5553s, every example cost time is 1.5553, generate speed: 12.8594 tokens/s, avg speed: 10.3148 tokens/s, remaining time: 0:17:08 +pred is: + ['1'] + label is: + ['A construction project'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:37,960 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:37,960 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:37,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:37,961 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:37,961 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:38,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:38,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:38,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,566 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.6045794486999512 s; generated tokens: 20 tokens; generate speed: 12.464325163957591 tokens/s +2024-07-30 14:17:39,571 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:39,571 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1317/2067], cost time 1.6158s, every example cost time is 1.6158, generate speed: 12.3778 tokens/s, avg speed: 10.3166 tokens/s, remaining time: 0:17:06 +pred is: + ['1'] + label is: + ['relationship contracting where the emphasis is on a co-operative relationship'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:39,654 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:39,654 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:39,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:39,655 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:39,655 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:40,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:40,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:41,193 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378947257995605 s; generated tokens: 20 tokens; generate speed: 13.004791332255778 tokens/s +2024-07-30 14:17:41,198 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:41,198 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1318/2067], cost time 1.5492s, every example cost time is 1.5492, generate speed: 12.9103 tokens/s, avg speed: 10.3189 tokens/s, remaining time: 0:17:05 +pred is: + ['The architect or engineer'] + label is: + ['the architect or engineer'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:41,281 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:41,281 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:41,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:41,282 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:41,282 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:42,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,818 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5352764129638672 s; generated tokens: 20 tokens; generate speed: 13.026970147603448 tokens/s +2024-07-30 14:17:42,823 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:42,823 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1319/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9319 tokens/s, avg speed: 10.3211 tokens/s, remaining time: 0:17:04 +pred is: + ['1'] + label is: + ['The owner'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:17:42,905 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:42,905 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:42,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:42,906 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:42,906 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:43,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:43,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:43,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:43,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:43,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,347 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4408442974090576 s; generated tokens: 17 tokens; generate speed: 11.79863780602081 tokens/s +2024-07-30 14:17:44,352 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:44,352 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1320/2067], cost time 1.4520s, every example cost time is 1.4520, generate speed: 11.7078 tokens/s, avg speed: 10.3222 tokens/s, remaining time: 0:17:03 +pred is: + ['1'] + label is: + ['contractors'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.30378525832687, Em score: 50.378787878787875, current_count: 1320 +2024-07-30 14:17:44,842 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:44,842 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:44,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:44,843 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:44,843 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:45,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:45,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:46,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:46,010 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1669001579284668 s; generated tokens: 8 tokens; generate speed: 6.855770774940983 tokens/s +2024-07-30 14:17:46,015 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:46,015 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1321/2067], cost time 1.1784s, every example cost time is 1.1784, generate speed: 6.7891 tokens/s, avg speed: 10.3199 tokens/s, remaining time: 0:17:01 +pred is: + ['960'] + label is: + ['$960 billion'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:17:46,098 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:46,098 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:46,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:46,099 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:46,099 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:47,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,203 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1039621829986572 s; generated tokens: 6 tokens; generate speed: 5.434968780997907 tokens/s +2024-07-30 14:17:47,208 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:47,208 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1322/2067], cost time 1.1151s, every example cost time is 1.1151, generate speed: 5.3805 tokens/s, avg speed: 10.3169 tokens/s, remaining time: 0:17:00 +pred is: + ['£42,090'] + label is: + ['£42,090'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:47,290 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:47,290 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:47,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:47,291 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:47,292 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:48,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:48,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:48,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:48,305 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0126500129699707 s; generated tokens: 3 tokens; generate speed: 2.962524032564213 tokens/s +2024-07-30 14:17:48,310 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:48,310 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1323/2067], cost time 1.0247s, every example cost time is 1.0247, generate speed: 2.9276 tokens/s, avg speed: 10.3127 tokens/s, remaining time: 0:16:58 +pred is: + ['Construction'] + label is: + ['Construction'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:48,392 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:48,392 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:48,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:48,393 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:48,393 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:49,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:49,936 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5421245098114014 s; generated tokens: 20 tokens; generate speed: 12.969121411892973 tokens/s +2024-07-30 14:17:49,940 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:49,941 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1324/2067], cost time 1.5535s, every example cost time is 1.5535, generate speed: 12.8745 tokens/s, avg speed: 10.3149 tokens/s, remaining time: 0:16:57 +pred is: + ['independent schools'] + label is: + ['independent'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:17:50,048 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:50,049 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:50,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:50,049 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:50,050 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:50,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,553 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5036208629608154 s; generated tokens: 19 tokens; generate speed: 12.63616412091187 tokens/s +2024-07-30 14:17:51,558 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:51,559 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1325/2067], cost time 1.5154s, every example cost time is 1.5154, generate speed: 12.5383 tokens/s, avg speed: 10.3167 tokens/s, remaining time: 0:16:55 +pred is: + ['$45,000'] + label is: + ['$45,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:51,641 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:51,641 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:51,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:51,642 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:51,642 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:52,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:52,929 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2872719764709473 s; generated tokens: 12 tokens; generate speed: 9.32203933538425 tokens/s +2024-07-30 14:17:52,934 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:52,934 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1326/2067], cost time 1.2983s, every example cost time is 1.2983, generate speed: 9.2431 tokens/s, avg speed: 10.3160 tokens/s, remaining time: 0:16:54 +pred is: + ['Lower sixth'] + label is: + ['lower sixth'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:53,017 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:53,017 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:53,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:53,017 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:53,018 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:53,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:53,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,263 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2447762489318848 s; generated tokens: 10 tokens; generate speed: 8.033572305529432 tokens/s +2024-07-30 14:17:54,267 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:54,268 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1327/2067], cost time 1.2559s, every example cost time is 1.2559, generate speed: 7.9627 tokens/s, avg speed: 10.3144 tokens/s, remaining time: 0:16:53 +pred is: + ['Roman Catholic'] + label is: + ['Roman Catholic'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:54,350 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:54,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:54,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:54,351 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:54,351 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:55,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:55,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:55,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:55,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:55,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0411200523376465 s; generated tokens: 4 tokens; generate speed: 3.842016097008913 tokens/s +2024-07-30 14:17:55,397 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:55,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1328/2067], cost time 1.0522s, every example cost time is 1.0522, generate speed: 3.8016 tokens/s, avg speed: 10.3106 tokens/s, remaining time: 0:16:51 +pred is: + ['Expulsion'] + label is: + ['expulsion'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:17:55,479 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:55,479 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:55,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:55,480 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:55,480 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:56,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:56,920 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4399707317352295 s; generated tokens: 17 tokens; generate speed: 11.805795510520019 tokens/s +2024-07-30 14:17:56,925 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:56,925 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1329/2067], cost time 1.4511s, every example cost time is 1.4511, generate speed: 11.7154 tokens/s, avg speed: 10.3117 tokens/s, remaining time: 0:16:50 +pred is: + ['Presbyterian Church'] + label is: + ['Presbyterian'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:17:57,008 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:57,008 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:57,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:57,009 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:57,009 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:57,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:57,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:58,540 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311639308929443 s; generated tokens: 20 tokens; generate speed: 13.061958681547832 tokens/s +2024-07-30 14:17:58,545 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:17:58,545 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1330/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9658 tokens/s, avg speed: 10.3140 tokens/s, remaining time: 0:16:48 +pred is: + ['7'] + label is: + ['7'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.45187709848982, Em score: 50.526315789473685, current_count: 1330 +2024-07-30 14:17:59,039 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:17:59,039 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 276, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:17:59,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:17:59,040 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:17:59,040 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:17:59,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,578 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5379831790924072 s; generated tokens: 20 tokens; generate speed: 13.004043393896138 tokens/s +2024-07-30 14:18:00,583 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:00,584 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1331/2067], cost time 1.5495s, every example cost time is 1.5495, generate speed: 12.9070 tokens/s, avg speed: 10.3162 tokens/s, remaining time: 0:16:47 +pred is: + ['Sonderungsverbot'] + label is: + ['Sonderungsverbot'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:00,666 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:00,666 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:00,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:00,667 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:00,667 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:01,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:01,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3018605709075928 s; generated tokens: 12 tokens; generate speed: 9.217576957288285 tokens/s +2024-07-30 14:18:01,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:01,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1332/2067], cost time 1.3130s, every example cost time is 1.3130, generate speed: 9.1394 tokens/s, avg speed: 10.3153 tokens/s, remaining time: 0:16:46 +pred is: + ['Ergänzungsschulen'] + label is: + ['Ergänzungsschulen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:02,057 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:02,057 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:02,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:02,058 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:02,058 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:03,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,193 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1350817680358887 s; generated tokens: 7 tokens; generate speed: 6.1669565991819155 tokens/s +2024-07-30 14:18:03,198 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:03,198 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1333/2067], cost time 1.1461s, every example cost time is 1.1461, generate speed: 6.1078 tokens/s, avg speed: 10.3127 tokens/s, remaining time: 0:16:44 +pred is: + ['Unaided independent school'] + label is: + ['independent'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:18:03,281 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:03,281 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:03,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:03,282 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:03,282 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:04,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,381 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0983445644378662 s; generated tokens: 5 tokens; generate speed: 4.55230549855637 tokens/s +2024-07-30 14:18:04,385 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:04,386 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1334/2067], cost time 1.1094s, every example cost time is 1.1094, generate speed: 4.5071 tokens/s, avg speed: 10.3091 tokens/s, remaining time: 0:16:43 +pred is: + ['Societies'] + label is: + ['societies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:04,468 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:04,468 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 239, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:04,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:04,469 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:04,469 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:05,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,727 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2579848766326904 s; generated tokens: 11 tokens; generate speed: 8.744143275747668 tokens/s +2024-07-30 14:18:05,732 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:05,732 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1335/2067], cost time 1.2691s, every example cost time is 1.2691, generate speed: 8.6676 tokens/s, avg speed: 10.3080 tokens/s, remaining time: 0:16:41 +pred is: + ['scoil phríobháideach'] + label is: + ['scoil phríobháideach'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:05,814 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:05,814 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:05,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:05,815 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:05,815 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:06,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:06,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:07,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:07,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:07,345 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529127597808838 s; generated tokens: 20 tokens; generate speed: 13.07935323949354 tokens/s +2024-07-30 14:18:07,349 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:07,350 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1336/2067], cost time 1.5403s, every example cost time is 1.5403, generate speed: 12.9843 tokens/s, avg speed: 10.3103 tokens/s, remaining time: 0:16:40 +pred is: + ['1957'] + label is: + ['1957'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:07,432 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:07,432 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:07,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:07,433 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:07,433 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:08,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,601 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1678202152252197 s; generated tokens: 8 tokens; generate speed: 6.850369513818667 tokens/s +2024-07-30 14:18:08,606 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:08,606 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1337/2067], cost time 1.1790s, every example cost time is 1.1790, generate speed: 6.7853 tokens/s, avg speed: 10.3080 tokens/s, remaining time: 0:16:39 +pred is: + ['Aided'] + label is: + ['aided'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:08,716 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:08,716 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 262, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:08,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:08,717 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:08,717 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:09,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:09,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2288081645965576 s; generated tokens: 10 tokens; generate speed: 8.13796676170621 tokens/s +2024-07-30 14:18:09,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:09,951 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1338/2067], cost time 1.2405s, every example cost time is 1.2405, generate speed: 8.0614 tokens/s, avg speed: 10.3065 tokens/s, remaining time: 0:16:37 +pred is: + ['88'] + label is: + ['88'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:10,033 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:10,034 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:10,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:10,034 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:10,035 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:10,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,145 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,210 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1753110885620117 s; generated tokens: 8 tokens; generate speed: 6.8067085198591695 tokens/s +2024-07-30 14:18:11,215 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:11,215 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1339/2067], cost time 1.1866s, every example cost time is 1.1866, generate speed: 6.7422 tokens/s, avg speed: 10.3042 tokens/s, remaining time: 0:16:36 +pred is: + ['Anglican'] + label is: + ['Anglican'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:11,298 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:11,298 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:11,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:11,299 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:11,299 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:12,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:12,527 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2280762195587158 s; generated tokens: 10 tokens; generate speed: 8.14281706683751 tokens/s +2024-07-30 14:18:12,532 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:12,532 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1340/2067], cost time 1.2394s, every example cost time is 1.2394, generate speed: 8.0685 tokens/s, avg speed: 10.3026 tokens/s, remaining time: 0:16:34 +pred is: + ['7.5'] + label is: + ['7.5'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.66741035397374, Em score: 50.82089552238806, current_count: 1340 +2024-07-30 14:18:13,018 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:13,018 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:13,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:13,019 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:13,019 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:13,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:13,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,150 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.130535364151001 s; generated tokens: 7 tokens; generate speed: 6.191756774682405 tokens/s +2024-07-30 14:18:14,155 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:14,155 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1341/2067], cost time 1.1421s, every example cost time is 1.1421, generate speed: 6.1288 tokens/s, avg speed: 10.3000 tokens/s, remaining time: 0:16:33 +pred is: + ['Education Service Contracting scheme'] + label is: + ['Education Service Contracting'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:18:14,237 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:14,238 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:14,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:14,238 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:14,238 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:15,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,464 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.22501540184021 s; generated tokens: 10 tokens; generate speed: 8.163162671243208 tokens/s +2024-07-30 14:18:15,469 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:15,469 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1342/2067], cost time 1.2366s, every example cost time is 1.2366, generate speed: 8.0868 tokens/s, avg speed: 10.2986 tokens/s, remaining time: 0:16:31 +pred is: + ['South African Schools Act of 1996'] + label is: + ['South African Schools Act'] +The F1/Em of this example is: {'F1': 77.77777777777779, 'Em': 0.0} +2024-07-30 14:18:15,552 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:15,552 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:15,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:15,552 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:15,553 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:16,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:16,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:17,089 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5358848571777344 s; generated tokens: 20 tokens; generate speed: 13.02180948430666 tokens/s +2024-07-30 14:18:17,094 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:17,094 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1343/2067], cost time 1.5471s, every example cost time is 1.5471, generate speed: 12.9275 tokens/s, avg speed: 10.3008 tokens/s, remaining time: 0:16:30 +pred is: + ['1'] + label is: + ['government schools formerly reserved for white children'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:17,176 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:17,176 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:17,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:17,177 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:17,177 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:18,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,402 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2248821258544922 s; generated tokens: 10 tokens; generate speed: 8.164050882058453 tokens/s +2024-07-30 14:18:18,407 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:18,407 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1344/2067], cost time 1.2360s, every example cost time is 1.2360, generate speed: 8.0907 tokens/s, avg speed: 10.2993 tokens/s, remaining time: 0:16:29 +pred is: + ['10'] + label is: + ['10'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:18,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:18,490 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:18,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:18,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:18,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:19,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,697 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2051806449890137 s; generated tokens: 9 tokens; generate speed: 7.467760154812346 tokens/s +2024-07-30 14:18:19,702 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:19,702 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1345/2067], cost time 1.2167s, every example cost time is 1.2167, generate speed: 7.3973 tokens/s, avg speed: 10.2974 tokens/s, remaining time: 0:16:27 +pred is: + ['13'] + label is: + ['13'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:19,784 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:19,784 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:19,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:19,785 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:19,785 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:20,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:20,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:21,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:21,197 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4115071296691895 s; generated tokens: 16 tokens; generate speed: 11.33540147526557 tokens/s +2024-07-30 14:18:21,201 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:21,202 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1346/2067], cost time 1.4229s, every example cost time is 1.4229, generate speed: 11.2447 tokens/s, avg speed: 10.2981 tokens/s, remaining time: 0:16:26 +pred is: + ['Brown v. Board of Education of Topeka'] + label is: + ['Brown v. Board of Education of Topeka'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:21,285 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:21,285 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:21,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:21,286 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:21,286 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:22,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5305595397949219 s; generated tokens: 20 tokens; generate speed: 13.067116619768859 tokens/s +2024-07-30 14:18:22,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:22,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1347/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9696 tokens/s, avg speed: 10.3003 tokens/s, remaining time: 0:16:25 +pred is: + ['1'] + label is: + ['endowments'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:22,904 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:22,904 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:22,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:22,905 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:22,905 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:23,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:23,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:23,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:23,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:23,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,263 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3579216003417969 s; generated tokens: 14 tokens; generate speed: 10.309873557115608 tokens/s +2024-07-30 14:18:24,268 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:24,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1348/2067], cost time 1.3691s, every example cost time is 1.3691, generate speed: 10.2256 tokens/s, avg speed: 10.3003 tokens/s, remaining time: 0:16:23 +pred is: + ['Massachusetts'] + label is: + ['Massachusetts'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:24,351 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:24,351 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:24,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:24,352 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:24,352 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:25,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,611 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.259326696395874 s; generated tokens: 11 tokens; generate speed: 8.734826341315097 tokens/s +2024-07-30 14:18:25,616 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:25,617 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1349/2067], cost time 1.2705s, every example cost time is 1.2705, generate speed: 8.6580 tokens/s, avg speed: 10.2991 tokens/s, remaining time: 0:16:22 +pred is: + ['40000'] + label is: + ['$40,000'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:25,698 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:25,698 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:25,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:25,699 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:25,699 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:26,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:26,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:27,112 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4130501747131348 s; generated tokens: 16 tokens; generate speed: 11.323023262955388 tokens/s +2024-07-30 14:18:27,117 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:27,118 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1350/2067], cost time 1.4243s, every example cost time is 1.4243, generate speed: 11.2335 tokens/s, avg speed: 10.2999 tokens/s, remaining time: 0:16:20 +pred is: + ['John Harvard'] + label is: + ['John Harvard'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.67810443365624, Em score: 50.81481481481482, current_count: 1350 +2024-07-30 14:18:27,603 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:27,603 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:27,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:27,604 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:27,604 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:28,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,675 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.071305751800537 s; generated tokens: 5 tokens; generate speed: 4.667201675708854 tokens/s +2024-07-30 14:18:28,680 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:28,680 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1351/2067], cost time 1.0830s, every example cost time is 1.0830, generate speed: 4.6167 tokens/s, avg speed: 10.2965 tokens/s, remaining time: 0:16:19 +pred is: + ['Harvard Library'] + label is: + ['Harvard Library'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:28,763 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:28,763 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:28,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:28,764 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:28,764 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:29,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:29,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:30,120 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.356539249420166 s; generated tokens: 14 tokens; generate speed: 10.32037960271633 tokens/s +2024-07-30 14:18:30,125 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:30,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1352/2067], cost time 1.3677s, every example cost time is 1.3677, generate speed: 10.2359 tokens/s, avg speed: 10.2965 tokens/s, remaining time: 0:16:18 +pred is: + ['Boston'] + label is: + ['Boston metropolitan area'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:18:30,208 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:30,208 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:30,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:30,209 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:30,209 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:31,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,653 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4439375400543213 s; generated tokens: 17 tokens; generate speed: 11.773362440151294 tokens/s +2024-07-30 14:18:31,658 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:31,659 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1353/2067], cost time 1.4554s, every example cost time is 1.4554, generate speed: 11.6810 tokens/s, avg speed: 10.2976 tokens/s, remaining time: 0:16:16 +pred is: + ['1636'] + label is: + ['1636'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:31,741 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:31,741 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:31,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:31,742 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:31,742 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:32,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,815 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0724186897277832 s; generated tokens: 5 tokens; generate speed: 4.6623581329687305 tokens/s +2024-07-30 14:18:32,820 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:32,820 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1354/2067], cost time 1.0836s, every example cost time is 1.0836, generate speed: 4.6142 tokens/s, avg speed: 10.2943 tokens/s, remaining time: 0:16:15 +pred is: + ['Puritan'] + label is: + ['Puritan ministers'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:18:32,902 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:32,902 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:32,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:32,903 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:32,903 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:33,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:33,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:33,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:33,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:33,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,159 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2552869319915771 s; generated tokens: 11 tokens; generate speed: 8.762936759445058 tokens/s +2024-07-30 14:18:34,163 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:34,164 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1355/2067], cost time 1.2666s, every example cost time is 1.2666, generate speed: 8.6849 tokens/s, avg speed: 10.2932 tokens/s, remaining time: 0:16:13 +pred is: + ['1804'] + label is: + ['1804'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:34,246 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:34,246 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:34,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:34,247 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:34,247 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:35,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3274633884429932 s; generated tokens: 13 tokens; generate speed: 9.793113778639082 tokens/s +2024-07-30 14:18:35,580 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:35,580 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1356/2067], cost time 1.3387s, every example cost time is 1.3387, generate speed: 9.7112 tokens/s, avg speed: 10.2927 tokens/s, remaining time: 0:16:12 +pred is: + ['Louis Agassiz'] + label is: + ['Louis Agassiz'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:35,662 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:35,662 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:35,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:35,663 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:35,663 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:36,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,795 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1317367553710938 s; generated tokens: 7 tokens; generate speed: 6.185183936793426 tokens/s +2024-07-30 14:18:36,800 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:36,800 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1357/2067], cost time 1.1429s, every example cost time is 1.1429, generate speed: 6.1250 tokens/s, avg speed: 10.2902 tokens/s, remaining time: 0:16:10 +pred is: + ['Charles W. Eliot'] + label is: + ['Charles W. Eliot'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:36,882 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:36,882 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:36,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:36,883 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:36,883 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:37,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:37,985 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1016404628753662 s; generated tokens: 6 tokens; generate speed: 5.4464230410886865 tokens/s +2024-07-30 14:18:37,989 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:37,990 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1358/2067], cost time 1.1128s, every example cost time is 1.1128, generate speed: 5.3919 tokens/s, avg speed: 10.2872 tokens/s, remaining time: 0:16:09 +pred is: + ['James Bryant Conant'] + label is: + ['James Bryant Conant'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:38,080 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:38,081 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:38,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:38,081 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:38,081 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:39,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,620 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5380644798278809 s; generated tokens: 20 tokens; generate speed: 13.003356011601104 tokens/s +2024-07-30 14:18:39,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:39,625 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1359/2067], cost time 1.5498s, every example cost time is 1.5498, generate speed: 12.9051 tokens/s, avg speed: 10.2894 tokens/s, remaining time: 0:16:08 +pred is: + ['4:1'] + label is: + ['about four men attending Harvard College for every woman studying at Radcliffe'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:39,708 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:39,709 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:39,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:39,709 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:39,710 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:40,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:40,882 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1717920303344727 s; generated tokens: 8 tokens; generate speed: 6.8271500342228 tokens/s +2024-07-30 14:18:40,886 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:40,887 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1360/2067], cost time 1.1832s, every example cost time is 1.1832, generate speed: 6.7610 tokens/s, avg speed: 10.2872 tokens/s, remaining time: 0:16:06 +pred is: + ['3 miles (5 km)'] + label is: + ['3 miles'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 64.74174582262445, Em score: 50.88235294117647, current_count: 1360 +2024-07-30 14:18:41,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:41,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:41,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:41,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:41,365 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:42,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,898 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5325968265533447 s; generated tokens: 20 tokens; generate speed: 13.049746452221212 tokens/s +2024-07-30 14:18:42,903 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:42,904 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1361/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9471 tokens/s, avg speed: 10.2894 tokens/s, remaining time: 0:16:05 +pred is: + ['Allston'] + label is: + ['Allston'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:42,986 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:42,986 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:42,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:42,987 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:42,987 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:43,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:43,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:43,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:44,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:44,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0416207313537598 s; generated tokens: 4 tokens; generate speed: 3.8401693434051887 tokens/s +2024-07-30 14:18:44,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:44,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1362/2067], cost time 1.0530s, every example cost time is 1.0530, generate speed: 3.7986 tokens/s, avg speed: 10.2857 tokens/s, remaining time: 0:16:03 +pred is: + ['50%'] + label is: + ['approximately fifty percent'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:44,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:44,117 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:44,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:44,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:44,118 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:45,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,189 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0710444450378418 s; generated tokens: 5 tokens; generate speed: 4.668340350547584 tokens/s +2024-07-30 14:18:45,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:45,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1363/2067], cost time 1.0822s, every example cost time is 1.0822, generate speed: 4.6204 tokens/s, avg speed: 10.2824 tokens/s, remaining time: 0:16:02 +pred is: + ['2,400'] + label is: + ['2,400'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:45,283 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:45,284 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 306, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:45,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:45,284 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:45,285 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:46,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,605 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3197829723358154 s; generated tokens: 13 tokens; generate speed: 9.850104352378462 tokens/s +2024-07-30 14:18:46,609 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:46,610 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1364/2067], cost time 1.3313s, every example cost time is 1.3313, generate speed: 9.7650 tokens/s, avg speed: 10.2820 tokens/s, remaining time: 0:16:00 +pred is: + ['32 billion'] + label is: + ['$32 billion'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:18:46,691 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:46,692 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:46,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:46,692 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:46,692 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:47,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:47,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:48,226 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5332458019256592 s; generated tokens: 20 tokens; generate speed: 13.044222899473308 tokens/s +2024-07-30 14:18:48,231 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:48,231 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1365/2067], cost time 1.5445s, every example cost time is 1.5445, generate speed: 12.9496 tokens/s, avg speed: 10.2843 tokens/s, remaining time: 0:15:59 +pred is: + ['1980s'] + label is: + ['late 1980s'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:18:48,313 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:48,313 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:48,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:48,314 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:48,314 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:49,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,415 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1008739471435547 s; generated tokens: 6 tokens; generate speed: 5.45021527266427 tokens/s +2024-07-30 14:18:49,420 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:49,420 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1366/2067], cost time 1.1120s, every example cost time is 1.1120, generate speed: 5.3955 tokens/s, avg speed: 10.2813 tokens/s, remaining time: 0:15:58 +pred is: + ['5.3%'] + label is: + ['accepted 5.3% of applicants'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:18:49,503 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:49,503 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:49,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:49,504 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:49,504 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:50,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,730 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2263109683990479 s; generated tokens: 10 tokens; generate speed: 8.154538496100239 tokens/s +2024-07-30 14:18:50,735 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:50,735 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1367/2067], cost time 1.2375s, every example cost time is 1.2375, generate speed: 8.0806 tokens/s, avg speed: 10.2799 tokens/s, remaining time: 0:15:56 +pred is: + ['7'] + label is: + ['core curriculum of seven classes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:50,818 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:50,818 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:50,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:50,819 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:50,819 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:51,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:51,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:52,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:52,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:52,046 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2269959449768066 s; generated tokens: 10 tokens; generate speed: 8.149986184501225 tokens/s +2024-07-30 14:18:52,051 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:52,051 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1368/2067], cost time 1.2383s, every example cost time is 1.2383, generate speed: 8.0755 tokens/s, avg speed: 10.2784 tokens/s, remaining time: 0:15:55 +pred is: + ['8'] + label is: + ['beginning in early September and ending in mid-May'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:52,134 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:52,134 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:52,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:52,135 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:52,135 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:53,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,208 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0730855464935303 s; generated tokens: 5 tokens; generate speed: 4.6594607637184735 tokens/s +2024-07-30 14:18:53,213 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:53,213 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1369/2067], cost time 1.0843s, every example cost time is 1.0843, generate speed: 4.6113 tokens/s, avg speed: 10.2751 tokens/s, remaining time: 0:15:53 +pred is: + ['38,000'] + label is: + ['$38,000'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:18:53,296 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:53,296 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:53,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:53,297 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:53,297 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:54,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:54,830 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5334515571594238 s; generated tokens: 20 tokens; generate speed: 13.042472653683392 tokens/s +2024-07-30 14:18:54,835 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:54,836 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1370/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9463 tokens/s, avg speed: 10.2773 tokens/s, remaining time: 0:15:52 +pred is: + ['Widener Library'] + label is: + ['Widener Library'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.66803130671374, Em score: 50.72992700729927, current_count: 1370 +2024-07-30 14:18:55,316 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:55,317 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:55,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:55,317 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:55,318 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:56,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,849 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5316767692565918 s; generated tokens: 20 tokens; generate speed: 13.057585256520614 tokens/s +2024-07-30 14:18:56,855 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:56,855 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1371/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9589 tokens/s, avg speed: 10.2796 tokens/s, remaining time: 0:15:51 +pred is: + ['3'] + label is: + ['three museums.'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:18:56,937 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:56,938 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:56,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:56,938 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:56,938 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:57,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:57,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:57,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:57,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,472 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.533431053161621 s; generated tokens: 20 tokens; generate speed: 13.042647048763028 tokens/s +2024-07-30 14:18:58,477 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:58,477 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1372/2067], cost time 1.5446s, every example cost time is 1.5446, generate speed: 12.9482 tokens/s, avg speed: 10.2817 tokens/s, remaining time: 0:15:49 +pred is: + ['2003'] + label is: + ['2003'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:58,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:58,560 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:58,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:58,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:58,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:18:59,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:59,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:59,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:59,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0135304927825928 s; generated tokens: 3 tokens; generate speed: 2.959950412309415 tokens/s +2024-07-30 14:18:59,580 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:18:59,580 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1373/2067], cost time 1.0249s, every example cost time is 1.0249, generate speed: 2.9272 tokens/s, avg speed: 10.2777 tokens/s, remaining time: 0:15:48 +pred is: + ['42'] + label is: + ['42'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:18:59,662 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:18:59,662 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:18:59,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:18:59,663 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:18:59,663 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:00,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,860 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1969549655914307 s; generated tokens: 9 tokens; generate speed: 7.519079880798176 tokens/s +2024-07-30 14:19:00,865 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:00,865 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1374/2067], cost time 1.2081s, every example cost time is 1.2081, generate speed: 7.4500 tokens/s, avg speed: 10.2759 tokens/s, remaining time: 0:15:46 +pred is: + ['1875'] + label is: + ['1875'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:00,947 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:00,947 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:00,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:00,948 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:00,948 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:01,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:01,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:01,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:01,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,484 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5358567237854004 s; generated tokens: 20 tokens; generate speed: 13.022048014157424 tokens/s +2024-07-30 14:19:02,489 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:02,489 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1375/2067], cost time 1.5471s, every example cost time is 1.5471, generate speed: 12.9274 tokens/s, avg speed: 10.2781 tokens/s, remaining time: 0:15:45 +pred is: + ['Lavietes Pavilion'] + label is: + ['Lavietes Pavilion'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:02,572 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:02,572 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:02,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:02,573 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:02,573 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:03,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,738 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.164543867111206 s; generated tokens: 8 tokens; generate speed: 6.869642463400697 tokens/s +2024-07-30 14:19:03,742 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:03,743 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1376/2067], cost time 1.1756s, every example cost time is 1.1756, generate speed: 6.8053 tokens/s, avg speed: 10.2759 tokens/s, remaining time: 0:15:44 +pred is: + ['23'] + label is: + ['23 years'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:19:03,825 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:03,825 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 308, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:03,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:03,826 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:03,826 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:04,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:04,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:05,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:05,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:05,114 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.288163661956787 s; generated tokens: 12 tokens; generate speed: 9.315586485160884 tokens/s +2024-07-30 14:19:05,119 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:05,119 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1377/2067], cost time 1.2993s, every example cost time is 1.2993, generate speed: 9.2359 tokens/s, avg speed: 10.2752 tokens/s, remaining time: 0:15:42 +pred is: + ['Ban Ki-moon'] + label is: + ['General Ban Ki-moon'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:19:05,201 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:05,201 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 329, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:05,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:05,202 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:05,202 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:06,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,402 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1992018222808838 s; generated tokens: 9 tokens; generate speed: 7.504991931117971 tokens/s +2024-07-30 14:19:06,407 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:06,407 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1378/2067], cost time 1.2104s, every example cost time is 1.2104, generate speed: 7.4358 tokens/s, avg speed: 10.2734 tokens/s, remaining time: 0:15:41 +pred is: + ["Conan O'Brien"] + label is: + ["Conan O'Brien"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:06,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:06,490 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:06,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:06,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:06,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:07,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,810 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3187119960784912 s; generated tokens: 13 tokens; generate speed: 9.858103997429795 tokens/s +2024-07-30 14:19:07,815 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:07,815 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1379/2067], cost time 1.3304s, every example cost time is 1.3304, generate speed: 9.7717 tokens/s, avg speed: 10.2730 tokens/s, remaining time: 0:15:40 +pred is: + ['Shing-Tung Yau'] + label is: + ['Shing-Tung Yau'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:07,896 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:07,897 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:07,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:07,897 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:07,898 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:08,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:08,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:08,876 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9786703586578369 s; generated tokens: 2 tokens; generate speed: 2.0435890208658507 tokens/s +2024-07-30 14:19:08,881 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:08,881 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1380/2067], cost time 0.9897s, every example cost time is 0.9897, generate speed: 2.0209 tokens/s, avg speed: 10.2687 tokens/s, remaining time: 0:15:38 +pred is: + ['Jacksonville'] + label is: + ['Jacksonville'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.79724847115786, Em score: 50.869565217391305, current_count: 1380 +2024-07-30 14:19:09,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:09,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:09,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:09,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:09,365 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:10,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,470 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1047353744506836 s; generated tokens: 6 tokens; generate speed: 5.431164909500095 tokens/s +2024-07-30 14:19:10,475 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:10,475 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1381/2067], cost time 1.1166s, every example cost time is 1.1166, generate speed: 5.3733 tokens/s, avg speed: 10.2658 tokens/s, remaining time: 0:15:36 +pred is: + ['St. Johns River'] + label is: + ['St. Johns'] +The F1/Em of this example is: {'F1': 80.0, 'Em': 0.0} +2024-07-30 14:19:10,557 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:10,558 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:10,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:10,558 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:10,558 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:11,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:11,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:12,092 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5330188274383545 s; generated tokens: 20 tokens; generate speed: 13.046154190695507 tokens/s +2024-07-30 14:19:12,096 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:12,097 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1382/2067], cost time 1.5444s, every example cost time is 1.5444, generate speed: 12.9501 tokens/s, avg speed: 10.2680 tokens/s, remaining time: 0:15:35 +pred is: + ['3'] + label is: + ['third largest'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:12,179 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:12,180 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:12,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:12,180 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:12,180 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:13,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,407 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.226050853729248 s; generated tokens: 10 tokens; generate speed: 8.156268534525507 tokens/s +2024-07-30 14:19:13,411 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:13,412 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1383/2067], cost time 1.2375s, every example cost time is 1.2375, generate speed: 8.0811 tokens/s, avg speed: 10.2666 tokens/s, remaining time: 0:15:34 +pred is: + ['2500'] + label is: + ['thousands'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:13,494 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:13,494 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:13,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:13,495 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:13,495 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:14,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,757 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2620275020599365 s; generated tokens: 11 tokens; generate speed: 8.716133350537385 tokens/s +2024-07-30 14:19:14,762 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:14,762 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1384/2067], cost time 1.2732s, every example cost time is 1.2732, generate speed: 8.6397 tokens/s, avg speed: 10.2655 tokens/s, remaining time: 0:15:32 +pred is: + ['Jean Ribault'] + label is: + ['Jean Ribault'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:14,844 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:14,845 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 292, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:14,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:14,845 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:14,845 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:15,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:15,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:16,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:16,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:16,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:16,170 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3240303993225098 s; generated tokens: 13 tokens; generate speed: 9.818505682839263 tokens/s +2024-07-30 14:19:16,174 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:16,175 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1385/2067], cost time 1.3352s, every example cost time is 1.3352, generate speed: 9.7364 tokens/s, avg speed: 10.2651 tokens/s, remaining time: 0:15:31 +pred is: + ['French and Indian War'] + label is: + ['French and Indian War'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:16,257 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:16,257 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:16,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:16,258 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:16,258 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:17,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,616 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3574769496917725 s; generated tokens: 14 tokens; generate speed: 10.313250625123931 tokens/s +2024-07-30 14:19:17,621 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:17,621 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1386/2067], cost time 1.3686s, every example cost time is 1.3686, generate speed: 10.2291 tokens/s, avg speed: 10.2651 tokens/s, remaining time: 0:15:30 +pred is: + ['1'] + label is: + ['Confederate'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:17,703 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:17,703 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:17,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:17,704 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:17,704 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:18,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,804 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:18,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:19,250 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5452451705932617 s; generated tokens: 20 tokens; generate speed: 12.942929950929052 tokens/s +2024-07-30 14:19:19,255 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:19,255 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1387/2067], cost time 1.5565s, every example cost time is 1.5565, generate speed: 12.8494 tokens/s, avg speed: 10.2672 tokens/s, remaining time: 0:15:28 +pred is: + ['1'] + label is: + ['Gilded Age'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:19,337 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:19,337 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 307, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:19,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:19,338 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:19,338 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:20,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,537 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1982817649841309 s; generated tokens: 9 tokens; generate speed: 7.5107543676250375 tokens/s +2024-07-30 14:19:20,542 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:20,542 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1388/2067], cost time 1.2095s, every example cost time is 1.2095, generate speed: 7.4413 tokens/s, avg speed: 10.2654 tokens/s, remaining time: 0:15:27 +pred is: + ['Spanish moss'] + label is: + ['Spanish moss'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:20,624 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:20,624 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:20,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:20,625 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:20,625 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:21,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:21,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:22,156 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5314805507659912 s; generated tokens: 20 tokens; generate speed: 13.059258238700272 tokens/s +2024-07-30 14:19:22,161 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:22,162 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1389/2067], cost time 1.5427s, every example cost time is 1.5427, generate speed: 12.9640 tokens/s, avg speed: 10.2676 tokens/s, remaining time: 0:15:26 +pred is: + ['Filmmakers'] + label is: + ['New York–based filmmakers'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:19:22,245 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:22,245 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:22,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:22,246 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:22,246 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:23,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:23,776 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5303542613983154 s; generated tokens: 20 tokens; generate speed: 13.068869414409706 tokens/s +2024-07-30 14:19:23,781 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:23,781 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1390/2067], cost time 1.5417s, every example cost time is 1.5417, generate speed: 12.9731 tokens/s, avg speed: 10.2698 tokens/s, remaining time: 0:15:24 +pred is: + ['The construction of highways'] + label is: + ['highways'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +F1 score: 64.64043373395528, Em score: 50.719424460431654, current_count: 1390 +2024-07-30 14:19:24,302 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:24,302 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:24,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:24,303 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:24,303 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:25,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,832 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5283710956573486 s; generated tokens: 20 tokens; generate speed: 13.085827163852539 tokens/s +2024-07-30 14:19:25,837 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:25,837 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1391/2067], cost time 1.5405s, every example cost time is 1.5405, generate speed: 12.9825 tokens/s, avg speed: 10.2720 tokens/s, remaining time: 0:15:23 +pred is: + ["The city's tax base dissipated"] + label is: + ["Much of the city's tax base dissipated"] +The F1/Em of this example is: {'F1': 84.6153846153846, 'Em': 0.0} +2024-07-30 14:19:25,920 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:25,920 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:25,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:25,921 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:25,921 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:26,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:26,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:26,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:26,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,480 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.559159517288208 s; generated tokens: 20 tokens; generate speed: 12.827423864099105 tokens/s +2024-07-30 14:19:27,485 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:27,486 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1392/2067], cost time 1.5707s, every example cost time is 1.5707, generate speed: 12.7330 tokens/s, avg speed: 10.2740 tokens/s, remaining time: 0:15:22 +pred is: + ['Through the traditional old boy network'] + label is: + ['old boy network'] +The F1/Em of this example is: {'F1': 62.5, 'Em': 0.0} +2024-07-30 14:19:27,568 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:27,568 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:27,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:27,569 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:27,569 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:28,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:28,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:29,132 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5628836154937744 s; generated tokens: 20 tokens; generate speed: 12.796858193232282 tokens/s +2024-07-30 14:19:29,137 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:29,137 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1393/2067], cost time 1.5742s, every example cost time is 1.5742, generate speed: 12.7052 tokens/s, avg speed: 10.2760 tokens/s, remaining time: 0:15:21 +pred is: + ['Voters approved the plan'] + label is: + ['voters approved the plan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:29,220 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:29,220 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:29,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:29,221 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:29,221 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:30,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,755 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5336034297943115 s; generated tokens: 20 tokens; generate speed: 13.041181058575502 tokens/s +2024-07-30 14:19:30,759 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:30,760 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1394/2067], cost time 1.5450s, every example cost time is 1.5450, generate speed: 12.9453 tokens/s, avg speed: 10.2782 tokens/s, remaining time: 0:15:19 +pred is: + ['757.7'] + label is: + ['874.3 square miles'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:30,843 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:30,843 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:30,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:30,844 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:30,844 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:31,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:31,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:32,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:32,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:32,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:32,374 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529951810836792 s; generated tokens: 20 tokens; generate speed: 13.072307152642408 tokens/s +2024-07-30 14:19:32,379 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:32,379 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1395/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9741 tokens/s, avg speed: 10.2804 tokens/s, remaining time: 0:15:18 +pred is: + ["It is the tallest building in Downtown Jacksonville's skyline."] + label is: + ['tallest building in Downtown Jacksonville'] +The F1/Em of this example is: {'F1': 62.06896551724138, 'Em': 0.0} +2024-07-30 14:19:32,461 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:32,462 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:32,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:32,462 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:32,463 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:33,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,585 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1224546432495117 s; generated tokens: 6 tokens; generate speed: 5.345427573474123 tokens/s +2024-07-30 14:19:33,590 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:33,590 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1396/2067], cost time 1.1336s, every example cost time is 1.1336, generate speed: 5.2928 tokens/s, avg speed: 10.2774 tokens/s, remaining time: 0:15:16 +pred is: + ['Humid subtropical'] + label is: + ['subtropical'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:19:33,673 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:33,673 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:33,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:33,674 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:33,674 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:34,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,745 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0713222026824951 s; generated tokens: 5 tokens; generate speed: 4.667130007648909 tokens/s +2024-07-30 14:19:34,750 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:34,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1397/2067], cost time 1.0824s, every example cost time is 1.0824, generate speed: 4.6194 tokens/s, avg speed: 10.2742 tokens/s, remaining time: 0:15:15 +pred is: + ['104 °F'] + label is: + ['104 °F'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:34,833 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:34,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 384, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:34,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:34,834 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:34,834 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:35,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:35,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:36,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:36,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:36,371 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5365862846374512 s; generated tokens: 20 tokens; generate speed: 13.015865233184016 tokens/s +2024-07-30 14:19:36,375 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:36,376 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1398/2067], cost time 1.5479s, every example cost time is 1.5479, generate speed: 12.9204 tokens/s, avg speed: 10.2763 tokens/s, remaining time: 0:15:14 +pred is: + ['Hurricane Dora'] + label is: + ['Hurricane Dora'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:36,459 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:36,459 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:36,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:36,460 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:36,460 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:37,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:37,992 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5316567420959473 s; generated tokens: 20 tokens; generate speed: 13.05775599083097 tokens/s +2024-07-30 14:19:37,997 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:37,997 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1399/2067], cost time 1.5432s, every example cost time is 1.5432, generate speed: 12.9598 tokens/s, avg speed: 10.2785 tokens/s, remaining time: 0:15:12 +pred is: + ['Arab'] + label is: + ['Arab'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:38,080 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:38,081 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:38,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:38,081 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:38,081 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:39,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,185 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1036818027496338 s; generated tokens: 6 tokens; generate speed: 5.436349485016451 tokens/s +2024-07-30 14:19:39,190 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:39,190 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1400/2067], cost time 1.1148s, every example cost time is 1.1148, generate speed: 5.3823 tokens/s, avg speed: 10.2756 tokens/s, remaining time: 0:15:11 +pred is: + ['29.7%'] + label is: + ['29.7%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.72099088595033, Em score: 50.714285714285715, current_count: 1400 +2024-07-30 14:19:39,708 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:39,708 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 526, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:39,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:39,709 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:39,709 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:40,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:40,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:41,271 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5620675086975098 s; generated tokens: 20 tokens; generate speed: 12.803543949695548 tokens/s +2024-07-30 14:19:41,276 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:41,277 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1401/2067], cost time 1.5738s, every example cost time is 1.5738, generate speed: 12.7078 tokens/s, avg speed: 10.2776 tokens/s, remaining time: 0:15:10 +pred is: + ['40'] + label is: + ['40%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:41,359 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:41,359 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:41,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:41,360 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:41,360 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:42,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:42,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:42,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:42,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0095958709716797 s; generated tokens: 3 tokens; generate speed: 2.9714860037142063 tokens/s +2024-07-30 14:19:42,374 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:42,375 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1402/2067], cost time 1.0209s, every example cost time is 1.0209, generate speed: 2.9386 tokens/s, avg speed: 10.2737 tokens/s, remaining time: 0:15:08 +pred is: + ['400'] + label is: + ['400'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:42,456 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:42,456 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:42,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:42,457 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:42,457 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:43,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:43,983 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5259742736816406 s; generated tokens: 20 tokens; generate speed: 13.1063808511968 tokens/s +2024-07-30 14:19:43,988 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:43,988 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1403/2067], cost time 1.5372s, every example cost time is 1.5372, generate speed: 13.0105 tokens/s, avg speed: 10.2759 tokens/s, remaining time: 0:15:07 +pred is: + ['Neoclassical economics'] + label is: + ['Neoclassical economics'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:44,103 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:44,103 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:44,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:44,104 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:44,104 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:45,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,512 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4075260162353516 s; generated tokens: 16 tokens; generate speed: 11.367463063165612 tokens/s +2024-07-30 14:19:45,516 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:45,517 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1404/2067], cost time 1.4192s, every example cost time is 1.4192, generate speed: 11.2737 tokens/s, avg speed: 10.2767 tokens/s, remaining time: 0:15:06 +pred is: + ['The substitution of capital equipment for labor (mechanization and automation)'] + label is: + ['reduce costs and maximize profits'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:19:45,599 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:45,599 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 285, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:45,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:45,600 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:45,600 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:46,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:46,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:47,135 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5343501567840576 s; generated tokens: 20 tokens; generate speed: 13.03483426620119 tokens/s +2024-07-30 14:19:47,140 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:47,140 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1405/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9396 tokens/s, avg speed: 10.2788 tokens/s, remaining time: 0:15:04 +pred is: + ['Wages'] + label is: + ['workers wages'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:19:47,224 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:47,225 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:47,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:47,225 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:47,226 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:48,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,328 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1027913093566895 s; generated tokens: 6 tokens; generate speed: 5.440739285024004 tokens/s +2024-07-30 14:19:48,333 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:48,334 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1406/2067], cost time 1.1144s, every example cost time is 1.1144, generate speed: 5.3841 tokens/s, avg speed: 10.2760 tokens/s, remaining time: 0:15:03 +pred is: + ['Competition amongst employers'] + label is: + ['Competition amongst workers'] +The F1/Em of this example is: {'F1': 80.00000000000001, 'Em': 0.0} +2024-07-30 14:19:48,416 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:48,417 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:48,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:48,417 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:48,417 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:49,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,567 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1492767333984375 s; generated tokens: 7 tokens; generate speed: 6.0907871851724 tokens/s +2024-07-30 14:19:49,572 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:49,572 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1407/2067], cost time 1.1605s, every example cost time is 1.1605, generate speed: 6.0317 tokens/s, avg speed: 10.2734 tokens/s, remaining time: 0:15:01 +pred is: + ['Necessity-based entrepreneurship'] + label is: + ['entrepreneurship rates'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:19:49,655 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:49,655 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:49,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:49,656 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:49,656 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:50,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:50,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:51,127 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4711477756500244 s; generated tokens: 18 tokens; generate speed: 12.235344605029042 tokens/s +2024-07-30 14:19:51,132 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:51,133 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1408/2067], cost time 1.4825s, every example cost time is 1.4825, generate speed: 12.1416 tokens/s, avg speed: 10.2749 tokens/s, remaining time: 0:15:00 +pred is: + ['1'] + label is: + ['progressive tax'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:51,215 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:51,215 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:51,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:51,216 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:51,216 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:52,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,745 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5290017127990723 s; generated tokens: 20 tokens; generate speed: 13.080430082309674 tokens/s +2024-07-30 14:19:52,750 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:52,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1409/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9859 tokens/s, avg speed: 10.2770 tokens/s, remaining time: 0:14:59 +pred is: + ['Education'] + label is: + ['access to education'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:19:52,832 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:52,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:52,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:52,833 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:52,833 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:53,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:53,936 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1019260883331299 s; generated tokens: 6 tokens; generate speed: 5.445011297514633 tokens/s +2024-07-30 14:19:53,940 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:53,941 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1410/2067], cost time 1.1130s, every example cost time is 1.1130, generate speed: 5.3907 tokens/s, avg speed: 10.2742 tokens/s, remaining time: 0:14:57 +pred is: + ['Increasing access to education'] + label is: + ['increasing access to education'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.6284070262391, Em score: 50.56737588652482, current_count: 1410 +2024-07-30 14:19:54,444 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:54,444 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 243, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:54,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:54,445 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:54,445 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:55,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,792 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3471109867095947 s; generated tokens: 14 tokens; generate speed: 10.392610659494286 tokens/s +2024-07-30 14:19:55,797 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:55,797 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1411/2067], cost time 1.3586s, every example cost time is 1.3586, generate speed: 10.3047 tokens/s, avg speed: 10.2742 tokens/s, remaining time: 0:14:56 +pred is: + ['1910-1940'] + label is: + ['1910–1940'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:55,879 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:55,880 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:55,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:55,880 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:55,881 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:56,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:56,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:56,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:56,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:56,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:56,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,412 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311965942382812 s; generated tokens: 20 tokens; generate speed: 13.061680045043024 tokens/s +2024-07-30 14:19:57,417 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:57,417 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1412/2067], cost time 1.5424s, every example cost time is 1.5424, generate speed: 12.9671 tokens/s, avg speed: 10.2764 tokens/s, remaining time: 0:14:55 +pred is: + ['Unions'] + label is: + ['unions'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:19:57,499 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:57,500 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:57,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:57,500 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:57,501 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:19:58,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:58,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4686107635498047 s; generated tokens: 18 tokens; generate speed: 12.256481054579695 tokens/s +2024-07-30 14:19:58,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:19:58,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1413/2067], cost time 1.4799s, every example cost time is 1.4799, generate speed: 12.1629 tokens/s, avg speed: 10.2778 tokens/s, remaining time: 0:14:53 +pred is: + ['Sweden'] + label is: + ['Scandinavia'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:19:59,056 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:19:59,057 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 324, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:19:59,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:19:59,057 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:19:59,058 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:00,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,593 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353631973266602 s; generated tokens: 20 tokens; generate speed: 13.0262338154409 tokens/s +2024-07-30 14:20:00,598 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:00,598 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1414/2067], cost time 1.5465s, every example cost time is 1.5465, generate speed: 12.9321 tokens/s, avg speed: 10.2799 tokens/s, remaining time: 0:14:52 +pred is: + ['A'] + label is: + ['reduced wages'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:00,680 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:00,681 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:00,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:00,681 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:00,681 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:01,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:01,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:01,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:01,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:01,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0406677722930908 s; generated tokens: 4 tokens; generate speed: 3.8436858587309564 tokens/s +2024-07-30 14:20:01,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:01,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1415/2067], cost time 1.0519s, every example cost time is 1.0519, generate speed: 3.8027 tokens/s, avg speed: 10.2764 tokens/s, remaining time: 0:14:50 +pred is: + ['53%'] + label is: + ['53%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:01,809 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:01,809 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:01,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:01,810 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:01,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:02,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:02,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:03,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:03,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:03,340 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5303034782409668 s; generated tokens: 20 tokens; generate speed: 13.06930310515228 tokens/s +2024-07-30 14:20:03,345 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:03,346 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1416/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9745 tokens/s, avg speed: 10.2786 tokens/s, remaining time: 0:14:49 +pred is: + ['1'] + label is: + ['social welfare'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:03,428 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:03,429 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 254, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:03,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:03,429 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:03,430 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:04,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,808 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.378021478652954 s; generated tokens: 15 tokens; generate speed: 10.885171408694461 tokens/s +2024-07-30 14:20:04,813 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:04,813 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1417/2067], cost time 1.3896s, every example cost time is 1.3896, generate speed: 10.7941 tokens/s, avg speed: 10.2789 tokens/s, remaining time: 0:14:48 +pred is: + ['1910 to 1940'] + label is: + ['1910 to 1940'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:04,895 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:04,895 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:04,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:04,896 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:04,896 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:05,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:05,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:05,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:05,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:05,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:05,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,242 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3459303379058838 s; generated tokens: 14 tokens; generate speed: 10.401727047614088 tokens/s +2024-07-30 14:20:06,247 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:06,247 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1418/2067], cost time 1.3570s, every example cost time is 1.3570, generate speed: 10.3171 tokens/s, avg speed: 10.2790 tokens/s, remaining time: 0:14:46 +pred is: + ['Wealth condensation'] + label is: + ['Wealth concentration'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:20:06,330 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:06,330 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:06,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:06,331 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:06,331 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:07,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,860 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5291905403137207 s; generated tokens: 20 tokens; generate speed: 13.07881488457083 tokens/s +2024-07-30 14:20:07,865 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:07,865 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1419/2067], cost time 1.5403s, every example cost time is 1.5403, generate speed: 12.9843 tokens/s, avg speed: 10.2811 tokens/s, remaining time: 0:14:45 +pred is: + ['market forces'] + label is: + ['market'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:20:07,948 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:07,948 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:07,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:07,949 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:07,949 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:08,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:08,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:08,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:08,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,485 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.53645658493042 s; generated tokens: 20 tokens; generate speed: 13.016963965113092 tokens/s +2024-07-30 14:20:09,490 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:09,491 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1420/2067], cost time 1.5478s, every example cost time is 1.5478, generate speed: 12.9219 tokens/s, avg speed: 10.2832 tokens/s, remaining time: 0:14:44 +pred is: + ['inequality'] + label is: + ['inequality'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.53712716455198, Em score: 50.49295774647887, current_count: 1420 +2024-07-30 14:20:09,993 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:09,994 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:09,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:09,994 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:09,994 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:10,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:10,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,311 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3159854412078857 s; generated tokens: 13 tokens; generate speed: 9.878528738181075 tokens/s +2024-07-30 14:20:11,316 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:11,316 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1421/2067], cost time 1.3278s, every example cost time is 1.3278, generate speed: 9.7905 tokens/s, avg speed: 10.2829 tokens/s, remaining time: 0:14:42 +pred is: + ['2013'] + label is: + ['2013'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:11,398 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:11,398 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:11,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:11,399 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:11,399 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:12,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:12,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:12,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:12,409 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0103344917297363 s; generated tokens: 3 tokens; generate speed: 2.969313652614067 tokens/s +2024-07-30 14:20:12,414 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:12,414 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1422/2067], cost time 1.0215s, every example cost time is 1.0215, generate speed: 2.9369 tokens/s, avg speed: 10.2790 tokens/s, remaining time: 0:14:41 +pred is: + ['British'] + label is: + ['British'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:12,504 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:12,505 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:12,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:12,505 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:12,506 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:13,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:13,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:14,068 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5625545978546143 s; generated tokens: 20 tokens; generate speed: 12.79955275000309 tokens/s +2024-07-30 14:20:14,073 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:14,073 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1423/2067], cost time 1.5742s, every example cost time is 1.5742, generate speed: 12.7048 tokens/s, avg speed: 10.2810 tokens/s, remaining time: 0:14:40 +pred is: + ['1'] + label is: + ['better health and longer lives'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:14,156 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:14,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:14,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:14,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:14,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:15,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,692 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.53480863571167 s; generated tokens: 20 tokens; generate speed: 13.030940492934008 tokens/s +2024-07-30 14:20:15,697 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:15,697 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1424/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9369 tokens/s, avg speed: 10.2831 tokens/s, remaining time: 0:14:38 +pred is: + ['income inequality'] + label is: + ['income inequality'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:15,780 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:15,780 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:15,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:15,781 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:15,781 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:16,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:16,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:17,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:17,309 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528062343597412 s; generated tokens: 20 tokens; generate speed: 13.088471215719755 tokens/s +2024-07-30 14:20:17,314 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:17,314 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1425/2067], cost time 1.5392s, every example cost time is 1.5392, generate speed: 12.9939 tokens/s, avg speed: 10.2852 tokens/s, remaining time: 0:14:37 +pred is: + ['inequality'] + label is: + ['inequality'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:17,404 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:17,405 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:17,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:17,405 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:17,406 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:18,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:18,944 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5380845069885254 s; generated tokens: 20 tokens; generate speed: 13.00318669691223 tokens/s +2024-07-30 14:20:18,949 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:18,949 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1426/2067], cost time 1.5496s, every example cost time is 1.5496, generate speed: 12.9068 tokens/s, avg speed: 10.2873 tokens/s, remaining time: 0:14:36 +pred is: + ['1'] + label is: + ['the greatest good'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:19,032 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:19,032 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:19,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:19,033 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:19,033 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:19,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,326 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2926597595214844 s; generated tokens: 12 tokens; generate speed: 9.283185240052765 tokens/s +2024-07-30 14:20:20,330 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:20,331 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1427/2067], cost time 1.3038s, every example cost time is 1.3038, generate speed: 9.2041 tokens/s, avg speed: 10.2866 tokens/s, remaining time: 0:14:34 +pred is: + ['Consumption'] + label is: + ['consumption'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:20,412 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:20,413 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:20,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:20,413 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:20,414 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:21,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:21,944 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307188034057617 s; generated tokens: 20 tokens; generate speed: 13.06575705185116 tokens/s +2024-07-30 14:20:21,949 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:21,950 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1428/2067], cost time 1.5419s, every example cost time is 1.5419, generate speed: 12.9707 tokens/s, avg speed: 10.2887 tokens/s, remaining time: 0:14:33 +pred is: + ['Economist'] + label is: + ['economist'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:22,032 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:22,032 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:22,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:22,033 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:22,033 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:22,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,562 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5284545421600342 s; generated tokens: 20 tokens; generate speed: 13.085112738607004 tokens/s +2024-07-30 14:20:23,566 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:23,567 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1429/2067], cost time 1.5396s, every example cost time is 1.5396, generate speed: 12.9900 tokens/s, avg speed: 10.2908 tokens/s, remaining time: 0:14:32 +pred is: + ['Inequality'] + label is: + ['inequality in wealth and income'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:20:23,649 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:23,649 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:23,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:23,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:23,650 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:24,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:24,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:25,179 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.528921365737915 s; generated tokens: 20 tokens; generate speed: 13.081117478103426 tokens/s +2024-07-30 14:20:25,184 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:25,184 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1430/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9865 tokens/s, avg speed: 10.2930 tokens/s, remaining time: 0:14:31 +pred is: + ['1'] + label is: + ['economists'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.51938501654811, Em score: 50.55944055944056, current_count: 1430 +2024-07-30 14:20:25,687 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:25,687 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:25,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:25,688 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:25,688 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:26,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:26,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:27,220 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5315804481506348 s; generated tokens: 20 tokens; generate speed: 13.058406448156061 tokens/s +2024-07-30 14:20:27,225 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:27,225 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1431/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9596 tokens/s, avg speed: 10.2951 tokens/s, remaining time: 0:14:29 +pred is: + ['Stiglitz presented evidence in 2009 that both global inequality and inequality within countries prevent'] + label is: + ['evidence'] +The F1/Em of this example is: {'F1': 7.142857142857142, 'Em': 0.0} +2024-07-30 14:20:27,309 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:27,309 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:27,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:27,310 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:27,310 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:28,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,567 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.257256031036377 s; generated tokens: 11 tokens; generate speed: 8.749212354887268 tokens/s +2024-07-30 14:20:28,572 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:28,572 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1432/2067], cost time 1.2684s, every example cost time is 1.2684, generate speed: 8.6724 tokens/s, avg speed: 10.2940 tokens/s, remaining time: 0:14:28 +pred is: + ['1993'] + label is: + ['1993'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:28,655 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:28,655 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:28,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:28,656 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:28,656 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:29,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:29,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:30,193 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372631549835205 s; generated tokens: 20 tokens; generate speed: 13.01013423444368 tokens/s +2024-07-30 14:20:30,198 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:30,198 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1433/2067], cost time 1.5486s, every example cost time is 1.5486, generate speed: 12.9149 tokens/s, avg speed: 10.2961 tokens/s, remaining time: 0:14:27 +pred is: + ['Reduce growth'] + label is: + ['reduce'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:20:30,282 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:30,282 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:30,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:30,282 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:30,283 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:31,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530470371246338 s; generated tokens: 20 tokens; generate speed: 13.06787793854056 tokens/s +2024-07-30 14:20:31,818 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:31,818 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1434/2067], cost time 1.5419s, every example cost time is 1.5419, generate speed: 12.9708 tokens/s, avg speed: 10.2982 tokens/s, remaining time: 0:14:25 +pred is: + ['1'] + label is: + ['Kuznets curve hypothesis'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:31,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:31,901 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:31,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:31,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:31,902 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:32,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:32,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:32,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:32,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:32,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,221 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3197040557861328 s; generated tokens: 13 tokens; generate speed: 9.85069337553566 tokens/s +2024-07-30 14:20:33,226 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:33,227 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1435/2067], cost time 1.3309s, every example cost time is 1.3309, generate speed: 9.7679 tokens/s, avg speed: 10.2978 tokens/s, remaining time: 0:14:24 +pred is: + ['1970s'] + label is: + ['the 1970s'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:20:33,309 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:33,309 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:33,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:33,310 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:33,310 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:34,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,839 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5284309387207031 s; generated tokens: 20 tokens; generate speed: 13.085314810978637 tokens/s +2024-07-30 14:20:34,843 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:34,844 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1436/2067], cost time 1.5397s, every example cost time is 1.5397, generate speed: 12.9894 tokens/s, avg speed: 10.2999 tokens/s, remaining time: 0:14:23 +pred is: + ['Special efforts must be made to ensure poorer sections of society are able to participate in economic growth.'] + label is: + ['special efforts'] +The F1/Em of this example is: {'F1': 15.384615384615385, 'Em': 0.0} +2024-07-30 14:20:34,927 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:34,927 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:34,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:34,928 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:34,928 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:35,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:35,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:35,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:35,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:35,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,456 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5277507305145264 s; generated tokens: 20 tokens; generate speed: 13.09114085205789 tokens/s +2024-07-30 14:20:36,461 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:36,461 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1437/2067], cost time 1.5390s, every example cost time is 1.5390, generate speed: 12.9952 tokens/s, avg speed: 10.3021 tokens/s, remaining time: 0:14:21 +pred is: + ['1'] + label is: + ['much land and housing'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:36,545 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:36,545 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:36,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:36,545 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:36,546 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:37,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:37,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:38,076 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297214984893799 s; generated tokens: 20 tokens; generate speed: 13.074275297660563 tokens/s +2024-07-30 14:20:38,081 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:38,081 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1438/2067], cost time 1.5411s, every example cost time is 1.5411, generate speed: 12.9773 tokens/s, avg speed: 10.3041 tokens/s, remaining time: 0:14:20 +pred is: + ['1'] + label is: + ['a shortage of affordable housing'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:38,163 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:38,163 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:38,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:38,164 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:38,164 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:39,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,701 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5366315841674805 s; generated tokens: 20 tokens; generate speed: 13.015481528603125 tokens/s +2024-07-30 14:20:39,706 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:39,707 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1439/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9169 tokens/s, avg speed: 10.3062 tokens/s, remaining time: 0:14:19 +pred is: + ['1'] + label is: + ['by everyone'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:39,790 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:39,790 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 287, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:39,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:39,791 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:39,791 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:40,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:40,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:40,773 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9817399978637695 s; generated tokens: 2 tokens; generate speed: 2.0371992628923414 tokens/s +2024-07-30 14:20:40,778 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:40,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1440/2067], cost time 0.9935s, every example cost time is 0.9935, generate speed: 2.0130 tokens/s, avg speed: 10.3020 tokens/s, remaining time: 0:14:17 +pred is: + ['A'] + label is: + ['created'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.22586669874393, Em score: 50.27777777777778, current_count: 1440 +2024-07-30 14:20:41,276 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:41,276 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:41,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:41,277 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:41,277 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:42,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,812 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5348401069641113 s; generated tokens: 20 tokens; generate speed: 13.030673298966414 tokens/s +2024-07-30 14:20:42,817 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:42,817 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1441/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9332 tokens/s, avg speed: 10.3041 tokens/s, remaining time: 0:14:16 +pred is: + ['The private ownership of the means of production by a class of owners'] + label is: + ['private ownership of the means of production'] +The F1/Em of this example is: {'F1': 68.42105263157895, 'Em': 0.0} +2024-07-30 14:20:42,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:42,901 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 217, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:42,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:42,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:42,902 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:43,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:43,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:43,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:43,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:43,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,441 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5387859344482422 s; generated tokens: 20 tokens; generate speed: 12.99725943178142 tokens/s +2024-07-30 14:20:44,445 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:44,446 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1442/2067], cost time 1.5500s, every example cost time is 1.5500, generate speed: 12.9030 tokens/s, avg speed: 10.3061 tokens/s, remaining time: 0:14:15 +pred is: + ['1'] + label is: + ['Robert Nozick'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:44,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:44,528 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:44,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:44,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:44,529 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:45,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:45,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:46,058 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5288176536560059 s; generated tokens: 20 tokens; generate speed: 13.082004876233679 tokens/s +2024-07-30 14:20:46,063 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:46,063 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1443/2067], cost time 1.5401s, every example cost time is 1.5401, generate speed: 12.9863 tokens/s, avg speed: 10.3082 tokens/s, remaining time: 0:14:13 +pred is: + ['capability deprivation'] + label is: + ['capability deprivation'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:46,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:46,147 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:46,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:46,147 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:46,148 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:47,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,682 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5344033241271973 s; generated tokens: 20 tokens; generate speed: 13.034382606917543 tokens/s +2024-07-30 14:20:47,687 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:47,687 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1444/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9401 tokens/s, avg speed: 10.3103 tokens/s, remaining time: 0:14:12 +pred is: + ['1'] + label is: + ['deprived of earning as much'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:47,770 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:47,771 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:47,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:47,771 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:47,771 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:48,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:48,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:48,750 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9787983894348145 s; generated tokens: 2 tokens; generate speed: 2.043321711179823 tokens/s +2024-07-30 14:20:48,755 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:48,755 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1445/2067], cost time 0.9900s, every example cost time is 0.9900, generate speed: 2.0201 tokens/s, avg speed: 10.3061 tokens/s, remaining time: 0:14:10 +pred is: + ['BBC'] + label is: + ['BBC'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:48,838 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:48,838 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 274, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:48,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:48,838 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:48,839 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:49,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:49,975 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1363253593444824 s; generated tokens: 7 tokens; generate speed: 6.160207499054781 tokens/s +2024-07-30 14:20:49,980 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:49,980 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1446/2067], cost time 1.1477s, every example cost time is 1.1477, generate speed: 6.0992 tokens/s, avg speed: 10.3037 tokens/s, remaining time: 0:14:09 +pred is: + ['1963-1989'] + label is: + ['1963 to 1989'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:50,062 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:50,063 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:50,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:50,063 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:50,064 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:51,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:51,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:51,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:51,075 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0109014511108398 s; generated tokens: 3 tokens; generate speed: 2.967648326850672 tokens/s +2024-07-30 14:20:51,079 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:51,080 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1447/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9353 tokens/s, avg speed: 10.2999 tokens/s, remaining time: 0:14:08 +pred is: + ['12'] + label is: + ['Twelve'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:20:51,162 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:51,162 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:51,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:51,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:51,163 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:52,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,695 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532106637954712 s; generated tokens: 20 tokens; generate speed: 13.053921642620796 tokens/s +2024-07-30 14:20:52,700 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:52,700 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1448/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9594 tokens/s, avg speed: 10.3019 tokens/s, remaining time: 0:14:06 +pred is: + ['Gallifrey'] + label is: + ['Gallifrey'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:52,782 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:52,782 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:52,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:52,783 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:52,783 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:53,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,854 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0709607601165771 s; generated tokens: 5 tokens; generate speed: 4.6687051348694935 tokens/s +2024-07-30 14:20:53,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:53,859 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1449/2067], cost time 1.0820s, every example cost time is 1.0820, generate speed: 4.6211 tokens/s, avg speed: 10.2988 tokens/s, remaining time: 0:14:05 +pred is: + ['rarely'] + label is: + ['rarely'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:53,940 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:53,941 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 485, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:53,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:53,941 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:53,942 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:54,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:54,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:54,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:54,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,115 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1733388900756836 s; generated tokens: 8 tokens; generate speed: 6.818149528380482 tokens/s +2024-07-30 14:20:55,120 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:55,120 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1450/2067], cost time 1.1844s, every example cost time is 1.1844, generate speed: 6.7542 tokens/s, avg speed: 10.2967 tokens/s, remaining time: 0:14:03 +pred is: + ['1963-11-23'] + label is: + ['23 November 1963'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.10597868884335, Em score: 50.206896551724135, current_count: 1450 +2024-07-30 14:20:55,620 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:55,620 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:55,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:55,621 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:55,621 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:56,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:56,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:56,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:56,632 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0105056762695312 s; generated tokens: 3 tokens; generate speed: 2.9688106365468974 tokens/s +2024-07-30 14:20:56,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:56,637 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1451/2067], cost time 1.0219s, every example cost time is 1.0219, generate speed: 2.9358 tokens/s, avg speed: 10.2929 tokens/s, remaining time: 0:14:02 +pred is: + ['26'] + label is: + ['26'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:56,718 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:56,719 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:56,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:56,719 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:56,719 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:57,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:57,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:58,250 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5303280353546143 s; generated tokens: 20 tokens; generate speed: 13.06909338256063 tokens/s +2024-07-30 14:20:58,255 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:58,255 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1452/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9745 tokens/s, avg speed: 10.2950 tokens/s, remaining time: 0:14:00 +pred is: + ['Relaunch the show'] + label is: + ['relaunch the show'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:58,338 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:58,338 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:58,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:58,339 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:58,339 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:20:59,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,548 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.20865797996521 s; generated tokens: 9 tokens; generate speed: 7.446275248403238 tokens/s +2024-07-30 14:20:59,553 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:20:59,553 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1453/2067], cost time 1.2198s, every example cost time is 1.2198, generate speed: 7.3784 tokens/s, avg speed: 10.2932 tokens/s, remaining time: 0:13:59 +pred is: + ['Rose'] + label is: + ['Rose'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:20:59,635 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:20:59,636 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:20:59,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:20:59,636 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:20:59,636 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:00,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,796 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1591136455535889 s; generated tokens: 7 tokens; generate speed: 6.0390972247219326 tokens/s +2024-07-30 14:21:00,801 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:00,801 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1454/2067], cost time 1.1705s, every example cost time is 1.1705, generate speed: 5.9804 tokens/s, avg speed: 10.2907 tokens/s, remaining time: 0:13:58 +pred is: + ['1963-1989'] + label is: + ['1963–1989'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:00,883 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:00,883 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:00,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:00,884 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:00,884 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:01,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:01,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:01,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:01,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:01,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:01,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:02,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:02,018 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1338679790496826 s; generated tokens: 7 tokens; generate speed: 6.173558235471858 tokens/s +2024-07-30 14:21:02,023 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:02,023 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1455/2067], cost time 1.1451s, every example cost time is 1.1451, generate speed: 6.1132 tokens/s, avg speed: 10.2883 tokens/s, remaining time: 0:13:56 +pred is: + ['30 November 1963'] + label is: + ['30 November 1963'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:02,129 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:02,129 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:02,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:02,130 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:02,130 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:03,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1341090202331543 s; generated tokens: 7 tokens; generate speed: 6.172246120184208 tokens/s +2024-07-30 14:21:03,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:03,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1456/2067], cost time 1.1456s, every example cost time is 1.1456, generate speed: 6.1101 tokens/s, avg speed: 10.2859 tokens/s, remaining time: 0:13:55 +pred is: + ['Hiding behind the sofa'] + label is: + ["Hiding behind (or 'watching from behind') the sofa"] +The F1/Em of this example is: {'F1': 30.76923076923077, 'Em': 0.0} +2024-07-30 14:21:03,352 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:03,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 234, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:03,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:03,353 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:03,353 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:04,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,884 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311059951782227 s; generated tokens: 20 tokens; generate speed: 13.062452934665686 tokens/s +2024-07-30 14:21:04,889 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:04,889 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1457/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9684 tokens/s, avg speed: 10.2880 tokens/s, remaining time: 0:13:53 +pred is: + ['1'] + label is: + ['Doctor Who'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:04,971 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:04,972 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:04,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:04,972 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:04,972 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:05,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:05,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:05,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,507 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534498691558838 s; generated tokens: 20 tokens; generate speed: 13.033572534156267 tokens/s +2024-07-30 14:21:06,512 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:06,512 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1458/2067], cost time 1.5457s, every example cost time is 1.5457, generate speed: 12.9395 tokens/s, avg speed: 10.2900 tokens/s, remaining time: 0:13:52 +pred is: + ['TARDIS'] + label is: + ['the TARDIS'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:21:06,595 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:06,595 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:06,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:06,596 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:06,596 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:07,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:07,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:08,133 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536900281906128 s; generated tokens: 20 tokens; generate speed: 13.013206019583238 tokens/s +2024-07-30 14:21:08,138 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:08,138 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1459/2067], cost time 1.5481s, every example cost time is 1.5481, generate speed: 12.9191 tokens/s, avg speed: 10.2921 tokens/s, remaining time: 0:13:51 +pred is: + ['26'] + label is: + ['26'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:08,220 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:08,221 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:08,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:08,221 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:08,222 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:09,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:09,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:09,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:09,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:09,282 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0598962306976318 s; generated tokens: 4 tokens; generate speed: 3.77395435906699 tokens/s +2024-07-30 14:21:09,286 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:09,287 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1460/2067], cost time 1.0710s, every example cost time is 1.0710, generate speed: 3.7349 tokens/s, avg speed: 10.2885 tokens/s, remaining time: 0:13:49 +pred is: + ['2005'] + label is: + ['2005'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.13317693807677, Em score: 50.273972602739725, current_count: 1460 +2024-07-30 14:21:09,792 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:09,792 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:09,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:09,793 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:09,793 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:10,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:10,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:10,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:10,806 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0130596160888672 s; generated tokens: 3 tokens; generate speed: 2.9613262164986303 tokens/s +2024-07-30 14:21:10,811 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:10,811 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1461/2067], cost time 1.0246s, every example cost time is 1.0246, generate speed: 2.9280 tokens/s, avg speed: 10.2848 tokens/s, remaining time: 0:13:48 +pred is: + ['826'] + label is: + ['826'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:10,918 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:10,919 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:10,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:10,920 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:10,920 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:11,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:11,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:11,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:11,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:11,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,454 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5339653491973877 s; generated tokens: 20 tokens; generate speed: 13.038104159565627 tokens/s +2024-07-30 14:21:12,459 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:12,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1462/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9402 tokens/s, avg speed: 10.2868 tokens/s, remaining time: 0:13:47 +pred is: + ['William Hartnell and Patrick Troughton'] + label is: + ['William Hartnell and Patrick Troughton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:12,542 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:12,542 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:12,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:12,543 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:12,543 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:13,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:13,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:14,073 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5296001434326172 s; generated tokens: 20 tokens; generate speed: 13.075312581442008 tokens/s +2024-07-30 14:21:14,078 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:14,078 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1463/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9792 tokens/s, avg speed: 10.2889 tokens/s, remaining time: 0:13:45 +pred is: + ['They bought prints for broadcast'] + label is: + ['bought prints for broadcast'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:21:14,161 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:14,161 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:14,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:14,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:14,162 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:15,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,296 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1331830024719238 s; generated tokens: 7 tokens; generate speed: 6.177289974108516 tokens/s +2024-07-30 14:21:15,300 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:15,301 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1464/2067], cost time 1.1442s, every example cost time is 1.1442, generate speed: 6.1178 tokens/s, avg speed: 10.2865 tokens/s, remaining time: 0:13:44 +pred is: + ['BBC'] + label is: + ['the BBC'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:21:15,382 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:15,383 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:15,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:15,383 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:15,384 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:16,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:16,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:16,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:16,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:16,425 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.040820837020874 s; generated tokens: 4 tokens; generate speed: 3.843120600322665 tokens/s +2024-07-30 14:21:16,429 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:16,430 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1465/2067], cost time 1.0521s, every example cost time is 1.0521, generate speed: 3.8020 tokens/s, avg speed: 10.2831 tokens/s, remaining time: 0:13:42 +pred is: + ['regeneration'] + label is: + ['regeneration'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:16,513 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:16,513 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:16,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:16,513 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:16,514 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:17,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:17,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:17,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:17,524 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0096535682678223 s; generated tokens: 3 tokens; generate speed: 2.9713161962541745 tokens/s +2024-07-30 14:21:17,528 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:17,528 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1466/2067], cost time 1.0207s, every example cost time is 1.0207, generate speed: 2.9390 tokens/s, avg speed: 10.2794 tokens/s, remaining time: 0:13:41 +pred is: + ['13'] + label is: + ['12'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:17,610 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:17,610 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:17,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:17,611 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:17,611 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:18,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:18,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:19,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5545439720153809 s; generated tokens: 20 tokens; generate speed: 12.865509345529222 tokens/s +2024-07-30 14:21:19,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:19,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1467/2067], cost time 1.5658s, every example cost time is 1.5658, generate speed: 12.7728 tokens/s, avg speed: 10.2813 tokens/s, remaining time: 0:13:39 +pred is: + ['John Hurt'] + label is: + ['John Hurt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:19,254 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:19,254 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 435, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:19,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:19,255 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:19,255 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:20,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,332 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0767056941986084 s; generated tokens: 5 tokens; generate speed: 4.643794517796711 tokens/s +2024-07-30 14:21:20,336 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:20,337 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1468/2067], cost time 1.0878s, every example cost time is 1.0878, generate speed: 4.5963 tokens/s, avg speed: 10.2782 tokens/s, remaining time: 0:13:38 +pred is: + ['The War Doctor'] + label is: + ['the War Doctor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:20,419 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:20,420 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:20,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:20,420 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:20,421 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:21,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:21,994 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5733702182769775 s; generated tokens: 20 tokens; generate speed: 12.711566399103647 tokens/s +2024-07-30 14:21:21,999 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:21,999 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1469/2067], cost time 1.5850s, every example cost time is 1.5850, generate speed: 12.6182 tokens/s, avg speed: 10.2801 tokens/s, remaining time: 0:13:37 +pred is: + ['Peter Davison, Colin Baker, Sylvester McCoy'] + label is: + ['Peter Davison, Colin Baker and Sylvester McCoy'] +The F1/Em of this example is: {'F1': 59.25925925925927, 'Em': 0.0} +2024-07-30 14:21:22,082 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:22,083 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 319, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:22,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:22,083 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:22,084 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:23,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,225 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.141357421875 s; generated tokens: 7 tokens; generate speed: 6.133048128342246 tokens/s +2024-07-30 14:21:23,230 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:23,230 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1470/2067], cost time 1.1525s, every example cost time is 1.1525, generate speed: 6.0738 tokens/s, avg speed: 10.2777 tokens/s, remaining time: 0:13:35 +pred is: + ['The Time of the Doctor'] + label is: + ['The Time of the Doctor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.23890992438866, Em score: 50.34013605442177, current_count: 1470 +2024-07-30 14:21:23,740 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:23,740 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:23,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:23,741 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:23,741 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:24,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:24,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:25,315 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.573314905166626 s; generated tokens: 20 tokens; generate speed: 12.712013300275604 tokens/s +2024-07-30 14:21:25,320 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:25,320 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1471/2067], cost time 1.5852s, every example cost time is 1.5852, generate speed: 12.6164 tokens/s, avg speed: 10.2795 tokens/s, remaining time: 0:13:34 +pred is: + ['An Unearthly Child'] + label is: + ['An Unearthly Child'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:25,403 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:25,404 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 310, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:25,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:25,404 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:25,404 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:26,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:26,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:26,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:26,421 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0162756443023682 s; generated tokens: 3 tokens; generate speed: 2.951955029936172 tokens/s +2024-07-30 14:21:26,426 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:26,426 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1472/2067], cost time 1.0280s, every example cost time is 1.0280, generate speed: 2.9184 tokens/s, avg speed: 10.2757 tokens/s, remaining time: 0:13:32 +pred is: + ['Human'] + label is: + ['a human'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:21:26,509 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:26,509 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:26,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:26,510 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:26,510 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:27,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:27,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:27,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:27,525 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0146360397338867 s; generated tokens: 3 tokens; generate speed: 2.956725251733443 tokens/s +2024-07-30 14:21:27,530 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:27,530 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1473/2067], cost time 1.0263s, every example cost time is 1.0263, generate speed: 2.9232 tokens/s, avg speed: 10.2720 tokens/s, remaining time: 0:13:31 +pred is: + ['Female'] + label is: + ['female'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:27,613 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:27,614 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:27,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:27,614 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:27,614 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:28,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:28,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:29,173 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5586936473846436 s; generated tokens: 20 tokens; generate speed: 12.831257786646088 tokens/s +2024-07-30 14:21:29,178 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:29,178 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1474/2067], cost time 1.5702s, every example cost time is 1.5702, generate speed: 12.7370 tokens/s, avg speed: 10.2739 tokens/s, remaining time: 0:13:30 +pred is: + ['Russell T Davies'] + label is: + ['Russell T Davies'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:29,260 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:29,260 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 291, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:29,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:29,261 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:29,261 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:30,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,812 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5503430366516113 s; generated tokens: 20 tokens; generate speed: 12.900370774196823 tokens/s +2024-07-30 14:21:30,817 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:30,817 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1475/2067], cost time 1.5616s, every example cost time is 1.5616, generate speed: 12.8077 tokens/s, avg speed: 10.2759 tokens/s, remaining time: 0:13:28 +pred is: + ['The Dalek race'] + label is: + ['The Dalek race'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:30,899 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:30,899 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:30,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:30,900 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:30,900 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:31,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:31,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:31,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:31,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:31,941 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.040569543838501 s; generated tokens: 4 tokens; generate speed: 3.844048697835817 tokens/s +2024-07-30 14:21:31,946 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:31,946 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1476/2067], cost time 1.0516s, every example cost time is 1.0516, generate speed: 3.8035 tokens/s, avg speed: 10.2725 tokens/s, remaining time: 0:13:27 +pred is: + ['The Master'] + label is: + ['The Master'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:32,028 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:32,028 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:32,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:32,029 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:32,029 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:32,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,557 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5279631614685059 s; generated tokens: 20 tokens; generate speed: 13.089320805861743 tokens/s +2024-07-30 14:21:33,562 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:33,562 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1477/2067], cost time 1.5391s, every example cost time is 1.5391, generate speed: 12.9948 tokens/s, avg speed: 10.2746 tokens/s, remaining time: 0:13:26 +pred is: + ['John Simm'] + label is: + ['Derek Jacobi'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:21:33,644 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:33,645 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:33,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:33,645 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:33,645 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:34,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:34,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:35,179 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5337262153625488 s; generated tokens: 20 tokens; generate speed: 13.040137020330134 tokens/s +2024-07-30 14:21:35,184 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:35,184 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1478/2067], cost time 1.5449s, every example cost time is 1.5449, generate speed: 12.9457 tokens/s, avg speed: 10.2766 tokens/s, remaining time: 0:13:24 +pred is: + ['Ron Grainer'] + label is: + ['Ron Grainer'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:35,266 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:35,267 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:35,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:35,267 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:35,268 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:36,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,744 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4766583442687988 s; generated tokens: 18 tokens; generate speed: 12.189684953098011 tokens/s +2024-07-30 14:21:36,749 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:36,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1479/2067], cost time 1.4880s, every example cost time is 1.4880, generate speed: 12.0966 tokens/s, avg speed: 10.2780 tokens/s, remaining time: 0:13:23 +pred is: + ['1'] + label is: + ['Peter Howell'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:36,831 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:36,832 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:36,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:36,832 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:36,832 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:37,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:37,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:38,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:38,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:38,365 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5326027870178223 s; generated tokens: 20 tokens; generate speed: 13.049695700290687 tokens/s +2024-07-30 14:21:38,370 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:38,370 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1480/2067], cost time 1.5438s, every example cost time is 1.5438, generate speed: 12.9553 tokens/s, avg speed: 10.2800 tokens/s, remaining time: 0:13:22 +pred is: + ['Voyage of the Damned'] + label is: + ['Voyage of the Damned'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.33414251498965, Em score: 50.472972972972975, current_count: 1480 +2024-07-30 14:21:38,878 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:38,878 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 394, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:38,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:38,879 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:38,879 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:39,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:39,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:39,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:39,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:39,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:39,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,109 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.229740858078003 s; generated tokens: 10 tokens; generate speed: 8.131794543794605 tokens/s +2024-07-30 14:21:40,114 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:40,114 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1481/2067], cost time 1.2410s, every example cost time is 1.2410, generate speed: 8.0578 tokens/s, avg speed: 10.2786 tokens/s, remaining time: 0:13:20 +pred is: + ['Jon Pertwee'] + label is: + ['Jon Pertwee'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:40,196 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:40,196 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:40,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:40,197 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:40,197 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:41,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:41,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:41,184 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9861278533935547 s; generated tokens: 2 tokens; generate speed: 2.028134580234616 tokens/s +2024-07-30 14:21:41,188 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:41,189 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1482/2067], cost time 0.9972s, every example cost time is 0.9972, generate speed: 2.0057 tokens/s, avg speed: 10.2746 tokens/s, remaining time: 0:13:19 +pred is: + ['Simpson'] + label is: + ['Dudley Simpson'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:21:41,270 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:41,270 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 307, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:41,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:41,271 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:41,271 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:42,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,439 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1678118705749512 s; generated tokens: 8 tokens; generate speed: 6.850418463430539 tokens/s +2024-07-30 14:21:42,444 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:42,444 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1483/2067], cost time 1.1789s, every example cost time is 1.1789, generate speed: 6.7859 tokens/s, avg speed: 10.2725 tokens/s, remaining time: 0:13:17 +pred is: + ['The BBC National Orchestra of Wales'] + label is: + ['the BBC National Orchestra of Wales'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:42,532 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:42,533 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:42,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:42,533 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:42,534 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:43,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:43,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:43,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:43,543 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0092239379882812 s; generated tokens: 3 tokens; generate speed: 2.972581096302568 tokens/s +2024-07-30 14:21:43,548 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:43,548 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1484/2067], cost time 1.0207s, every example cost time is 1.0207, generate speed: 2.9392 tokens/s, avg speed: 10.2688 tokens/s, remaining time: 0:13:16 +pred is: + ['6'] + label is: + ['Six'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:43,630 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:43,630 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:43,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:43,630 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:43,631 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:44,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:44,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:45,169 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.538266897201538 s; generated tokens: 20 tokens; generate speed: 13.001644926757905 tokens/s +2024-07-30 14:21:45,174 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:45,174 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1485/2067], cost time 1.5496s, every example cost time is 1.5496, generate speed: 12.9068 tokens/s, avg speed: 10.2709 tokens/s, remaining time: 0:13:15 +pred is: + ['The original logo used for the First Doctor (and briefly for the Second Doctor) was reused in'] + label is: + ['The original logo'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:21:45,258 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:45,258 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:45,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:45,259 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:45,259 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:46,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,454 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1949937343597412 s; generated tokens: 9 tokens; generate speed: 7.531420241983159 tokens/s +2024-07-30 14:21:46,459 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:46,459 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1486/2067], cost time 1.2062s, every example cost time is 1.2062, generate speed: 7.4615 tokens/s, avg speed: 10.2692 tokens/s, remaining time: 0:13:13 +pred is: + ['The assassination of John F. Kennedy'] + label is: + ['the assassination of John F. Kennedy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:46,541 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:46,541 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:46,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:46,542 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:46,542 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:47,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,800 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.257387399673462 s; generated tokens: 11 tokens; generate speed: 8.748298259435916 tokens/s +2024-07-30 14:21:47,804 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:47,805 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1487/2067], cost time 1.2685s, every example cost time is 1.2685, generate speed: 8.6715 tokens/s, avg speed: 10.2682 tokens/s, remaining time: 0:13:12 +pred is: + ['1979'] + label is: + ['During the ITV network strike of 1979'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:21:47,887 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:47,888 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:47,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:47,888 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:47,889 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:48,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:48,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:48,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:48,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:48,932 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0432376861572266 s; generated tokens: 4 tokens; generate speed: 3.8342173150723 tokens/s +2024-07-30 14:21:48,937 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:48,937 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1488/2067], cost time 1.0546s, every example cost time is 1.0546, generate speed: 3.7930 tokens/s, avg speed: 10.2648 tokens/s, remaining time: 0:13:10 +pred is: + ['TVNZ'] + label is: + ['PBS'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:21:49,019 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:49,019 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:49,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:49,020 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:49,020 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:49,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:49,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:50,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:50,031 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0109286308288574 s; generated tokens: 3 tokens; generate speed: 2.967568538978176 tokens/s +2024-07-30 14:21:50,036 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:50,036 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1489/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9354 tokens/s, avg speed: 10.2611 tokens/s, remaining time: 0:13:09 +pred is: + ['ABC'] + label is: + ['Australian Broadcasting Corporation (ABC)'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:21:50,118 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:50,118 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:50,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:50,119 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:50,119 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:51,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,377 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2576160430908203 s; generated tokens: 11 tokens; generate speed: 8.746707757453139 tokens/s +2024-07-30 14:21:51,382 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:51,382 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1490/2067], cost time 1.2688s, every example cost time is 1.2688, generate speed: 8.6695 tokens/s, avg speed: 10.2601 tokens/s, remaining time: 0:13:07 +pred is: + ['1976'] + label is: + ['1976'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.24417223924188, Em score: 50.40268456375839, current_count: 1490 +2024-07-30 14:21:51,900 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:51,900 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:51,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:51,901 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:51,901 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:52,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:52,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:52,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:52,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:52,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,432 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5308704376220703 s; generated tokens: 20 tokens; generate speed: 13.064462875817481 tokens/s +2024-07-30 14:21:53,437 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:53,437 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1491/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9652 tokens/s, avg speed: 10.2622 tokens/s, remaining time: 0:13:06 +pred is: + ['Christopher Eccleston'] + label is: + ['Christopher Eccleston'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:53,526 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:53,526 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:53,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:53,527 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:53,527 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:54,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,816 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2890863418579102 s; generated tokens: 12 tokens; generate speed: 9.308918735966797 tokens/s +2024-07-30 14:21:54,821 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:54,821 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1492/2067], cost time 1.3006s, every example cost time is 1.3006, generate speed: 9.2267 tokens/s, avg speed: 10.2615 tokens/s, remaining time: 0:13:05 +pred is: + ['United Kingdom, Australia, Canada and the United States'] + label is: + ['the United Kingdom, Australia, Canada and the United States'] +The F1/Em of this example is: {'F1': 94.44444444444444, 'Em': 0.0} +2024-07-30 14:21:54,905 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:54,906 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:54,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:54,906 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:54,906 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:55,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:55,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:55,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:55,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:55,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,437 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5299489498138428 s; generated tokens: 20 tokens; generate speed: 13.07233159801411 tokens/s +2024-07-30 14:21:56,441 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:56,442 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1493/2067], cost time 1.5414s, every example cost time is 1.5414, generate speed: 12.9755 tokens/s, avg speed: 10.2636 tokens/s, remaining time: 0:13:03 +pred is: + ['Trevor Martin'] + label is: + ['Trevor Martin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:56,532 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:56,533 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 330, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:56,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:56,533 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:56,534 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:57,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,823 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2895853519439697 s; generated tokens: 12 tokens; generate speed: 9.305316613522901 tokens/s +2024-07-30 14:21:57,828 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:57,828 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1494/2067], cost time 1.3013s, every example cost time is 1.3013, generate speed: 9.2213 tokens/s, avg speed: 10.2629 tokens/s, remaining time: 0:13:02 +pred is: + ['Torchwood'] + label is: + ['Torchwood'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:57,911 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:57,911 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:57,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:57,912 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:57,912 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:21:58,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:58,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:58,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:58,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:58,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:58,984 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0719830989837646 s; generated tokens: 5 tokens; generate speed: 4.664252640494032 tokens/s +2024-07-30 14:21:58,989 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:21:58,989 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1495/2067], cost time 1.0830s, every example cost time is 1.0830, generate speed: 4.6167 tokens/s, avg speed: 10.2599 tokens/s, remaining time: 0:13:00 +pred is: + ['Elisabeth Sladen'] + label is: + ['Elisabeth Sladen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:21:59,071 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:21:59,071 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:21:59,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:21:59,072 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:21:59,072 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:00,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,152 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.080245018005371 s; generated tokens: 5 tokens; generate speed: 4.628579550621116 tokens/s +2024-07-30 14:22:00,157 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:00,158 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1496/2067], cost time 1.0914s, every example cost time is 1.0914, generate speed: 4.5815 tokens/s, avg speed: 10.2569 tokens/s, remaining time: 0:12:59 +pred is: + ['Dimensions in Time'] + label is: + ['Dimensions in Time'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:00,239 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:00,240 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 222, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:00,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:00,240 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:00,240 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:01,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,473 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.232337474822998 s; generated tokens: 10 tokens; generate speed: 8.114660313674475 tokens/s +2024-07-30 14:22:01,478 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:01,478 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1497/2067], cost time 1.2435s, every example cost time is 1.2435, generate speed: 8.0421 tokens/s, avg speed: 10.2555 tokens/s, remaining time: 0:12:58 +pred is: + ['Doctor Who and the Curse of Fatal Death'] + label is: + ['Doctor Who and the Curse of Fatal Death'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:01,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:01,561 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 259, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:01,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:01,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:01,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:02,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,848 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.285963535308838 s; generated tokens: 12 tokens; generate speed: 9.331524316603637 tokens/s +2024-07-30 14:22:02,852 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:02,853 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1498/2067], cost time 1.2971s, every example cost time is 1.2971, generate speed: 9.2512 tokens/s, avg speed: 10.2549 tokens/s, remaining time: 0:12:56 +pred is: + ['The Neutral Zone'] + label is: + ['The Neutral Zone'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:02,934 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:02,934 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:02,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:02,935 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:02,935 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:03,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:03,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:03,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:03,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:03,975 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.04007887840271 s; generated tokens: 4 tokens; generate speed: 3.8458621582076136 tokens/s +2024-07-30 14:22:03,980 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:03,981 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1499/2067], cost time 1.0514s, every example cost time is 1.0514, generate speed: 3.8045 tokens/s, avg speed: 10.2516 tokens/s, remaining time: 0:12:55 +pred is: + ['The Chase'] + label is: + ['The Chase'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:04,062 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:04,062 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:04,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:04,063 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:04,063 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:05,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:05,592 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5287487506866455 s; generated tokens: 20 tokens; generate speed: 13.082594501560113 tokens/s +2024-07-30 14:22:05,597 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:05,597 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1500/2067], cost time 1.5400s, every example cost time is 1.5400, generate speed: 12.9867 tokens/s, avg speed: 10.2536 tokens/s, remaining time: 0:12:53 +pred is: + ['5,6,7'] + label is: + ['the Fifth, Sixth and Seventh Doctors'] +The F1/Em of this example is: {'F1': 11.76470588235294, 'Em': 0.0} +F1 score: 64.42001719119813, Em score: 50.6, current_count: 1500 +2024-07-30 14:22:06,122 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:06,122 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:06,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:06,123 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:06,123 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:07,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,653 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5295467376708984 s; generated tokens: 20 tokens; generate speed: 13.075769119977853 tokens/s +2024-07-30 14:22:07,658 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:07,658 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1501/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9766 tokens/s, avg speed: 10.2557 tokens/s, remaining time: 0:12:52 +pred is: + ['1991'] + label is: + ['1991'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:07,741 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:07,741 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:07,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:07,742 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:07,742 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:08,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:08,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:08,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:08,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:08,782 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0402138233184814 s; generated tokens: 4 tokens; generate speed: 3.8453632419911834 tokens/s +2024-07-30 14:22:08,787 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:08,787 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1502/2067], cost time 1.0514s, every example cost time is 1.0514, generate speed: 3.8045 tokens/s, avg speed: 10.2524 tokens/s, remaining time: 0:12:51 +pred is: + ['1960'] + label is: + ['the early 1960s'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:08,869 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:08,869 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:08,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:08,870 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:08,870 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:09,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:09,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:09,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:09,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:09,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:09,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,405 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534958839416504 s; generated tokens: 20 tokens; generate speed: 13.029665347640696 tokens/s +2024-07-30 14:22:10,410 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:10,411 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1503/2067], cost time 1.5463s, every example cost time is 1.5463, generate speed: 12.9344 tokens/s, avg speed: 10.2544 tokens/s, remaining time: 0:12:49 +pred is: + ['2006'] + label is: + ['2006'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:10,492 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:10,493 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:10,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:10,493 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:10,494 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:11,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:11,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:12,024 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5300140380859375 s; generated tokens: 20 tokens; generate speed: 13.071775488426365 tokens/s +2024-07-30 14:22:12,029 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:12,029 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1504/2067], cost time 1.5412s, every example cost time is 1.5412, generate speed: 12.9767 tokens/s, avg speed: 10.2565 tokens/s, remaining time: 0:12:48 +pred is: + ['Based on its over-all broadcast ratings, DVD and book sales, and iTunes traffic'] + label is: + ['Guinness World Records'] +The F1/Em of this example is: {'F1': 6.25, 'Em': 0.0} +2024-07-30 14:22:12,112 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:12,113 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:12,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:12,113 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:12,114 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:13,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:13,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:13,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:13,126 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011780023574829 s; generated tokens: 3 tokens; generate speed: 2.965071389134939 tokens/s +2024-07-30 14:22:13,130 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:13,131 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1505/2067], cost time 1.0229s, every example cost time is 1.0229, generate speed: 2.9329 tokens/s, avg speed: 10.2528 tokens/s, remaining time: 0:12:47 +pred is: + ['11'] + label is: + ['Season 11'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:22:13,212 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:13,212 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:13,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:13,213 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:13,213 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:14,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0729072093963623 s; generated tokens: 5 tokens; generate speed: 4.66023525260222 tokens/s +2024-07-30 14:22:14,291 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:14,291 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1506/2067], cost time 1.0842s, every example cost time is 1.0842, generate speed: 4.6119 tokens/s, avg speed: 10.2498 tokens/s, remaining time: 0:12:45 +pred is: + ['Best Drama Series'] + label is: + ['Best Drama Series'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:14,373 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:14,374 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:14,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:14,374 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:14,375 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:15,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,905 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5300321578979492 s; generated tokens: 20 tokens; generate speed: 13.071620682454943 tokens/s +2024-07-30 14:22:15,910 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:15,910 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1507/2067], cost time 1.5413s, every example cost time is 1.5413, generate speed: 12.9758 tokens/s, avg speed: 10.2519 tokens/s, remaining time: 0:12:44 +pred is: + ['6'] + label is: + ['six'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:15,991 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:15,992 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:15,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:15,992 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:15,993 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:16,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:16,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:16,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:17,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:17,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:17,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:17,095 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1018221378326416 s; generated tokens: 6 tokens; generate speed: 5.445525002612857 tokens/s +2024-07-30 14:22:17,099 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:17,100 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1508/2067], cost time 1.1130s, every example cost time is 1.1130, generate speed: 5.3909 tokens/s, avg speed: 10.2492 tokens/s, remaining time: 0:12:42 +pred is: + ['Spike Milligan'] + label is: + ['Spike Milligan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:17,182 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:17,182 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:17,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:17,183 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:17,183 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:18,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,714 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530719518661499 s; generated tokens: 20 tokens; generate speed: 13.065750946645354 tokens/s +2024-07-30 14:22:18,719 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:18,719 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1509/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9703 tokens/s, avg speed: 10.2513 tokens/s, remaining time: 0:12:41 +pred is: + ['1'] + label is: + ['a private research university'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:18,801 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:18,801 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:18,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:18,802 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:18,802 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:19,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:19,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:20,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:20,333 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307624340057373 s; generated tokens: 20 tokens; generate speed: 13.065384644737787 tokens/s +2024-07-30 14:22:20,338 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:20,339 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1510/2067], cost time 1.5424s, every example cost time is 1.5424, generate speed: 12.9671 tokens/s, avg speed: 10.2533 tokens/s, remaining time: 0:12:40 +pred is: + ['1'] + label is: + ['various academic disciplines'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.29554687867363, Em score: 50.52980132450331, current_count: 1510 +2024-07-30 14:22:20,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:20,864 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:20,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:20,865 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:20,865 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:21,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:21,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:22,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:22,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:22,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:22,150 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2849273681640625 s; generated tokens: 12 tokens; generate speed: 9.339049270268024 tokens/s +2024-07-30 14:22:22,155 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:22,155 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1511/2067], cost time 1.3003s, every example cost time is 1.3003, generate speed: 9.2286 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:12:38 +pred is: + ['American Baptist Education Society'] + label is: + ['the American Baptist Education Society'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:22:22,238 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:22,238 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:22,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:22,239 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:22,239 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:23,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,404 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.164595603942871 s; generated tokens: 8 tokens; generate speed: 6.869337281469283 tokens/s +2024-07-30 14:22:23,408 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:23,409 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1512/2067], cost time 1.1756s, every example cost time is 1.1756, generate speed: 6.8051 tokens/s, avg speed: 10.2507 tokens/s, remaining time: 0:12:37 +pred is: + ['Marshall Field'] + label is: + ['Marshall Field'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:23,490 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:23,491 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 377, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:23,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:23,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:23,492 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:24,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:24,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:25,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5367176532745361 s; generated tokens: 20 tokens; generate speed: 13.01475255222241 tokens/s +2024-07-30 14:22:25,033 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:25,033 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1513/2067], cost time 1.5479s, every example cost time is 1.5479, generate speed: 12.9207 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:12:36 +pred is: + ['1'] + label is: + ['several regional colleges and universities'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:25,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:25,116 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:25,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:25,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:25,117 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:26,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,646 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5293052196502686 s; generated tokens: 20 tokens; generate speed: 13.0778341321386 tokens/s +2024-07-30 14:22:26,651 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:26,651 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1514/2067], cost time 1.5404s, every example cost time is 1.5404, generate speed: 12.9839 tokens/s, avg speed: 10.2547 tokens/s, remaining time: 0:12:34 +pred is: + ['Robert Maynard Hutchins'] + label is: + ['Robert Maynard Hutchins'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:26,734 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:26,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:26,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:26,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:26,735 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:27,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:27,994 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2589776515960693 s; generated tokens: 11 tokens; generate speed: 8.737248025058067 tokens/s +2024-07-30 14:22:27,999 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:27,999 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1515/2067], cost time 1.2701s, every example cost time is 1.2701, generate speed: 8.6610 tokens/s, avg speed: 10.2538 tokens/s, remaining time: 0:12:33 +pred is: + ['1950'] + label is: + ['1950s'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:28,081 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:28,081 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:28,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:28,082 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:28,082 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:29,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,616 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5339508056640625 s; generated tokens: 20 tokens; generate speed: 13.038227775069881 tokens/s +2024-07-30 14:22:29,621 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:29,622 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1516/2067], cost time 1.5453s, every example cost time is 1.5453, generate speed: 12.9426 tokens/s, avg speed: 10.2558 tokens/s, remaining time: 0:12:32 +pred is: + ['1962'] + label is: + ['1962'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:29,705 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:29,705 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 299, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:29,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:29,706 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:29,706 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:30,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:30,964 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2578811645507812 s; generated tokens: 11 tokens; generate speed: 8.744864228830675 tokens/s +2024-07-30 14:22:30,969 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:30,969 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1517/2067], cost time 1.2693s, every example cost time is 1.2693, generate speed: 8.6660 tokens/s, avg speed: 10.2548 tokens/s, remaining time: 0:12:30 +pred is: + ['2008'] + label is: + ['mid-2000s'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:31,051 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:31,052 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:31,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:31,053 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:31,053 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:31,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,156 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1031301021575928 s; generated tokens: 6 tokens; generate speed: 5.439068327720099 tokens/s +2024-07-30 14:22:32,161 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:32,161 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1518/2067], cost time 1.1149s, every example cost time is 1.1149, generate speed: 5.3815 tokens/s, avg speed: 10.2522 tokens/s, remaining time: 0:12:29 +pred is: + ['The Main Quadrangles'] + label is: + ['the Main Quadrangles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:32,244 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:32,244 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 315, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:32,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:32,245 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:32,245 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:33,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,539 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.293785572052002 s; generated tokens: 12 tokens; generate speed: 9.27510729692824 tokens/s +2024-07-30 14:22:33,544 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:33,544 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1519/2067], cost time 1.3049s, every example cost time is 1.3049, generate speed: 9.1959 tokens/s, avg speed: 10.2515 tokens/s, remaining time: 0:12:27 +pred is: + ['1950s'] + label is: + ['the 1940s'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:33,626 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:33,626 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:33,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:33,627 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:33,627 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:34,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:34,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:35,155 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5282294750213623 s; generated tokens: 20 tokens; generate speed: 13.087039824120936 tokens/s +2024-07-30 14:22:35,160 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:35,160 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1520/2067], cost time 1.5394s, every example cost time is 1.5394, generate speed: 12.9923 tokens/s, avg speed: 10.2535 tokens/s, remaining time: 0:12:26 +pred is: + ['Singapore, London, and the downtown Streeterville neighborhood of Chicago'] + label is: + ['Singapore, London, and the downtown Streeterville neighborhood of Chicago'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.25906301762973, Em score: 50.526315789473685, current_count: 1520 +2024-07-30 14:22:35,682 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:35,682 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:35,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:35,684 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:35,684 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:36,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:36,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:37,216 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5315661430358887 s; generated tokens: 20 tokens; generate speed: 13.058528416119046 tokens/s +2024-07-30 14:22:37,221 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:37,221 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1521/2067], cost time 1.5442s, every example cost time is 1.5442, generate speed: 12.9518 tokens/s, avg speed: 10.2555 tokens/s, remaining time: 0:12:25 +pred is: + ['The Board of Trustees'] + label is: + ['a board of trustees'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:22:37,303 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:37,303 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 134, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:37,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:37,304 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:37,304 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:38,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,832 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5278935432434082 s; generated tokens: 20 tokens; generate speed: 13.089917218672221 tokens/s +2024-07-30 14:22:38,837 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:38,837 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1522/2067], cost time 1.5391s, every example cost time is 1.5391, generate speed: 12.9943 tokens/s, avg speed: 10.2576 tokens/s, remaining time: 0:12:23 +pred is: + ['The Higher Learning Commission'] + label is: + ['The Higher Learning Commission'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:38,919 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:38,920 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:38,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:38,920 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:38,921 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:39,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:39,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:39,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:39,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:39,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5273847579956055 s; generated tokens: 20 tokens; generate speed: 13.094277584808491 tokens/s +2024-07-30 14:22:40,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:40,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1523/2067], cost time 1.5385s, every example cost time is 1.5385, generate speed: 12.9997 tokens/s, avg speed: 10.2596 tokens/s, remaining time: 0:12:22 +pred is: + ['78'] + label is: + ['50'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:40,536 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:40,536 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:40,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:40,537 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:40,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:41,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:41,913 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3761053085327148 s; generated tokens: 15 tokens; generate speed: 10.90032856278557 tokens/s +2024-07-30 14:22:41,918 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:41,918 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1524/2067], cost time 1.3872s, every example cost time is 1.3872, generate speed: 10.8129 tokens/s, avg speed: 10.2600 tokens/s, remaining time: 0:12:21 +pred is: + ['Common Core'] + label is: + ['the Common Core'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:22:42,000 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:42,000 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 256, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:42,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:42,001 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:42,001 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:42,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:42,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,257 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2559585571289062 s; generated tokens: 11 tokens; generate speed: 8.75825076995037 tokens/s +2024-07-30 14:22:43,262 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:43,262 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1525/2067], cost time 1.2671s, every example cost time is 1.2671, generate speed: 8.6812 tokens/s, avg speed: 10.2590 tokens/s, remaining time: 0:12:19 +pred is: + ['University of Chicago Laboratory Schools'] + label is: + ['University of Chicago Laboratory Schools'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:43,346 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:43,346 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 262, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:43,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:43,347 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:43,347 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:44,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,542 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1949949264526367 s; generated tokens: 9 tokens; generate speed: 7.531412728852881 tokens/s +2024-07-30 14:22:44,547 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:44,547 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1526/2067], cost time 1.2059s, every example cost time is 1.2059, generate speed: 7.4630 tokens/s, avg speed: 10.2574 tokens/s, remaining time: 0:12:18 +pred is: + ['6'] + label is: + ['six'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:44,629 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:44,629 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:44,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:44,630 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:44,630 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:45,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,855 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2243802547454834 s; generated tokens: 10 tokens; generate speed: 8.167397310796014 tokens/s +2024-07-30 14:22:45,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:45,860 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1527/2067], cost time 1.2353s, every example cost time is 1.2353, generate speed: 8.0952 tokens/s, avg speed: 10.2561 tokens/s, remaining time: 0:12:17 +pred is: + ['12'] + label is: + ['12'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:45,941 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:45,942 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:45,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:45,942 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:45,943 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:46,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:46,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:46,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:46,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,477 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5340003967285156 s; generated tokens: 20 tokens; generate speed: 13.037806276095482 tokens/s +2024-07-30 14:22:47,482 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:47,482 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1528/2067], cost time 1.5451s, every example cost time is 1.5451, generate speed: 12.9440 tokens/s, avg speed: 10.2581 tokens/s, remaining time: 0:12:15 +pred is: + ['1'] + label is: + ['shaping ideas about the free market'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:47,564 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:47,564 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 427, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:47,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:47,565 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:47,565 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:48,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,828 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2622733116149902 s; generated tokens: 11 tokens; generate speed: 8.714436009049633 tokens/s +2024-07-30 14:22:48,832 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:48,833 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1529/2067], cost time 1.2733s, every example cost time is 1.2733, generate speed: 8.6391 tokens/s, avg speed: 10.2571 tokens/s, remaining time: 0:12:14 +pred is: + ['1933'] + label is: + ['1933'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:48,914 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:48,915 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 276, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:48,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:48,915 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:48,915 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:49,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:49,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:49,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:49,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:49,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,174 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2585628032684326 s; generated tokens: 11 tokens; generate speed: 8.740128002697585 tokens/s +2024-07-30 14:22:50,179 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:50,179 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1530/2067], cost time 1.2696s, every example cost time is 1.2696, generate speed: 8.6639 tokens/s, avg speed: 10.2561 tokens/s, remaining time: 0:12:12 +pred is: + ['5792'] + label is: + ['5,792'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.20554906700097, Em score: 50.45751633986928, current_count: 1530 +2024-07-30 14:22:50,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:50,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:50,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:50,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:50,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:51,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:51,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:52,267 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5531666278839111 s; generated tokens: 20 tokens; generate speed: 12.876918445800438 tokens/s +2024-07-30 14:22:52,272 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:52,273 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1531/2067], cost time 1.5647s, every example cost time is 1.5647, generate speed: 12.7820 tokens/s, avg speed: 10.2580 tokens/s, remaining time: 0:12:11 +pred is: + ['1'] + label is: + ['the University Athletic Association'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:52,354 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:52,354 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:52,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:52,355 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:52,355 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:53,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,911 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5551505088806152 s; generated tokens: 20 tokens; generate speed: 12.860491563865313 tokens/s +2024-07-30 14:22:53,915 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:53,916 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1532/2067], cost time 1.5663s, every example cost time is 1.5663, generate speed: 12.7688 tokens/s, avg speed: 10.2599 tokens/s, remaining time: 0:12:10 +pred is: + ['400'] + label is: + ['over 400'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:22:53,999 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:53,999 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:53,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:53,999 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:54,000 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:54,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:54,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,530 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5298752784729004 s; generated tokens: 20 tokens; generate speed: 13.072961097824729 tokens/s +2024-07-30 14:22:55,534 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:55,535 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1533/2067], cost time 1.5410s, every example cost time is 1.5410, generate speed: 12.9787 tokens/s, avg speed: 10.2619 tokens/s, remaining time: 0:12:09 +pred is: + ['1'] + label is: + ['graduate and undergraduate students'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:55,617 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:55,617 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:55,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:55,618 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:55,618 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:56,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,781 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1633567810058594 s; generated tokens: 8 tokens; generate speed: 6.876652227945974 tokens/s +2024-07-30 14:22:56,786 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:56,787 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1534/2067], cost time 1.1745s, every example cost time is 1.1745, generate speed: 6.8115 tokens/s, avg speed: 10.2600 tokens/s, remaining time: 0:12:07 +pred is: + ['15'] + label is: + ['fifteen'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:56,868 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:56,868 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:56,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:56,869 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:56,869 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:57,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:57,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:57,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:57,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:57,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:57,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,401 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5310285091400146 s; generated tokens: 20 tokens; generate speed: 13.063114031256077 tokens/s +2024-07-30 14:22:58,405 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:58,406 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1535/2067], cost time 1.5422s, every example cost time is 1.5422, generate speed: 12.9685 tokens/s, avg speed: 10.2620 tokens/s, remaining time: 0:12:06 +pred is: + ['5'] + label is: + ['May'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:22:58,489 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:58,489 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:58,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:58,490 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:58,490 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:22:59,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,746 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2560582160949707 s; generated tokens: 11 tokens; generate speed: 8.75755586727382 tokens/s +2024-07-30 14:22:59,751 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:22:59,751 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1536/2067], cost time 1.2675s, every example cost time is 1.2675, generate speed: 8.6788 tokens/s, avg speed: 10.2610 tokens/s, remaining time: 0:12:04 +pred is: + ['Satya Nadella'] + label is: + ['Satya Nadella'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:22:59,833 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:22:59,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:22:59,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:22:59,834 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:22:59,834 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:00,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:00,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:01,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:01,030 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1953339576721191 s; generated tokens: 9 tokens; generate speed: 7.5292766027723825 tokens/s +2024-07-30 14:23:01,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:01,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1537/2067], cost time 1.2065s, every example cost time is 1.2065, generate speed: 7.4596 tokens/s, avg speed: 10.2594 tokens/s, remaining time: 0:12:03 +pred is: + ['Saul Alinsky'] + label is: + ['Saul Alinsky'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:01,117 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:01,117 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:01,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:01,118 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:01,118 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:02,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,188 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0701665878295898 s; generated tokens: 5 tokens; generate speed: 4.672169788201409 tokens/s +2024-07-30 14:23:02,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:02,193 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1538/2067], cost time 1.0812s, every example cost time is 1.0812, generate speed: 4.6247 tokens/s, avg speed: 10.2565 tokens/s, remaining time: 0:12:02 +pred is: + ['Allan Bloom'] + label is: + ['Allan Bloom'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:02,275 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:02,276 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:02,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:02,276 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:02,276 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:03,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:03,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:03,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:03,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:03,320 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.042940378189087 s; generated tokens: 4 tokens; generate speed: 3.8353103242060813 tokens/s +2024-07-30 14:23:03,324 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:03,325 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1539/2067], cost time 1.0540s, every example cost time is 1.0540, generate speed: 3.7951 tokens/s, avg speed: 10.2533 tokens/s, remaining time: 0:12:00 +pred is: + ['Philip Glass'] + label is: + ['Philip Glass'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:03,407 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:03,407 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:03,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:03,408 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:03,408 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:04,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:04,971 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.562694787979126 s; generated tokens: 20 tokens; generate speed: 12.798404495777428 tokens/s +2024-07-30 14:23:04,976 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:04,976 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1540/2067], cost time 1.5738s, every example cost time is 1.5738, generate speed: 12.7081 tokens/s, avg speed: 10.2551 tokens/s, remaining time: 0:11:59 +pred is: + ['Carl Sagan'] + label is: + ['Carl Sagan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.14577277435811, Em score: 50.45454545454545, current_count: 1540 +2024-07-30 14:23:05,504 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:05,504 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:05,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:05,505 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:05,505 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:06,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,724 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2191517353057861 s; generated tokens: 9 tokens; generate speed: 7.382182003573682 tokens/s +2024-07-30 14:23:06,729 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:06,730 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1541/2067], cost time 1.2305s, every example cost time is 1.2305, generate speed: 7.3139 tokens/s, avg speed: 10.2534 tokens/s, remaining time: 0:11:57 +pred is: + ['Milton Friedman'] + label is: + ['Milton Friedman'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:06,812 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:06,813 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:06,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:06,813 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:06,814 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:07,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:07,915 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1007177829742432 s; generated tokens: 6 tokens; generate speed: 5.450988521133396 tokens/s +2024-07-30 14:23:07,919 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:07,919 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1542/2067], cost time 1.1118s, every example cost time is 1.1118, generate speed: 5.3966 tokens/s, avg speed: 10.2508 tokens/s, remaining time: 0:11:56 +pred is: + ['David Graeber'] + label is: + ['David Graeber and Donald Johanson'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:23:08,002 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:08,002 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:08,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:08,003 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:08,003 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:08,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:08,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,292 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2882814407348633 s; generated tokens: 12 tokens; generate speed: 9.314734824678483 tokens/s +2024-07-30 14:23:09,297 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:09,297 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1543/2067], cost time 1.2994s, every example cost time is 1.2994, generate speed: 9.2348 tokens/s, avg speed: 10.2502 tokens/s, remaining time: 0:11:55 +pred is: + ['A. A. Michelson'] + label is: + ['A. A. Michelson'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:09,409 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:09,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:09,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:09,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:09,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:10,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,637 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2264742851257324 s; generated tokens: 10 tokens; generate speed: 8.153452641671038 tokens/s +2024-07-30 14:23:10,642 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:10,642 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1544/2067], cost time 1.2380s, every example cost time is 1.2380, generate speed: 8.0772 tokens/s, avg speed: 10.2489 tokens/s, remaining time: 0:11:53 +pred is: + ['James Henry Breasted'] + label is: + ['James Henry Breasted'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:10,724 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:10,725 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:10,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:10,725 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:10,726 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:11,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,858 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.132211446762085 s; generated tokens: 7 tokens; generate speed: 6.182590734282632 tokens/s +2024-07-30 14:23:11,863 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:11,863 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1545/2067], cost time 1.1432s, every example cost time is 1.1432, generate speed: 6.1230 tokens/s, avg speed: 10.2467 tokens/s, remaining time: 0:11:52 +pred is: + ['Raghuram Rajan'] + label is: + ['Raghuram Rajan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:11,945 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:11,945 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:11,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:11,946 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:11,946 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:12,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:12,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:12,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:12,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:12,988 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0419108867645264 s; generated tokens: 4 tokens; generate speed: 3.8390999180566263 tokens/s +2024-07-30 14:23:12,993 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:12,993 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1546/2067], cost time 1.0531s, every example cost time is 1.0531, generate speed: 3.7984 tokens/s, avg speed: 10.2435 tokens/s, remaining time: 0:11:50 +pred is: + ['大元'] + label is: + ['Yuán Cháo'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:13,075 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:13,075 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:13,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:13,076 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:13,076 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:14,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,178 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1019089221954346 s; generated tokens: 6 tokens; generate speed: 5.445096122867984 tokens/s +2024-07-30 14:23:14,183 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:14,183 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1547/2067], cost time 1.1130s, every example cost time is 1.1130, generate speed: 5.3910 tokens/s, avg speed: 10.2409 tokens/s, remaining time: 0:11:49 +pred is: + ['Mongol Empire'] + label is: + ['Mongol Empire'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:14,265 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:14,265 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 371, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:14,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:14,266 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:14,266 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:15,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,833 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5671417713165283 s; generated tokens: 20 tokens; generate speed: 12.762087238092283 tokens/s +2024-07-30 14:23:15,838 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:15,838 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1548/2067], cost time 1.5783s, every example cost time is 1.5783, generate speed: 12.6718 tokens/s, avg speed: 10.2427 tokens/s, remaining time: 0:11:47 +pred is: + ['1271'] + label is: + ['1271'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:15,920 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:15,920 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:15,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:15,921 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:15,921 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:16,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:16,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:16,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:16,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,474 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5525381565093994 s; generated tokens: 20 tokens; generate speed: 12.88213105497283 tokens/s +2024-07-30 14:23:17,479 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:17,479 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1549/2067], cost time 1.5637s, every example cost time is 1.5637, generate speed: 12.7905 tokens/s, avg speed: 10.2446 tokens/s, remaining time: 0:11:46 +pred is: + ['Mongol and Turkic tribes'] + label is: + ['Mongol and Turkic tribes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:17,561 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:17,561 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:17,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:17,562 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:17,562 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:18,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:18,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:19,094 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318684577941895 s; generated tokens: 20 tokens; generate speed: 13.055951311119072 tokens/s +2024-07-30 14:23:19,099 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:19,099 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1550/2067], cost time 1.5429s, every example cost time is 1.5429, generate speed: 12.9622 tokens/s, avg speed: 10.2466 tokens/s, remaining time: 0:11:45 +pred is: + ['Western Xia'] + label is: + ['the Jin'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +F1 score: 64.23730542312569, Em score: 50.58064516129032, current_count: 1550 +2024-07-30 14:23:19,627 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:19,627 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 355, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:19,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:19,628 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:19,628 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:20,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,704 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0758793354034424 s; generated tokens: 5 tokens; generate speed: 4.647361312247026 tokens/s +2024-07-30 14:23:20,709 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:20,709 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1551/2067], cost time 1.0874s, every example cost time is 1.0874, generate speed: 4.5981 tokens/s, avg speed: 10.2437 tokens/s, remaining time: 0:11:43 +pred is: + ['Jurchen'] + label is: + ['Han Chinese'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:20,792 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:20,792 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 299, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:20,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:20,793 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:20,793 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:21,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:21,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:22,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:22,174 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.380636215209961 s; generated tokens: 15 tokens; generate speed: 10.864556379696927 tokens/s +2024-07-30 14:23:22,179 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:22,179 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1552/2067], cost time 1.3918s, every example cost time is 1.3918, generate speed: 10.7778 tokens/s, avg speed: 10.2440 tokens/s, remaining time: 0:11:42 +pred is: + ['1'] + label is: + ['Möngke Khan'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:22,261 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:22,261 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:22,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:22,262 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:22,262 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:23,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,764 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5015268325805664 s; generated tokens: 19 tokens; generate speed: 12.653786524311434 tokens/s +2024-07-30 14:23:23,769 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:23,769 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1553/2067], cost time 1.5127s, every example cost time is 1.5127, generate speed: 12.5603 tokens/s, avg speed: 10.2457 tokens/s, remaining time: 0:11:41 +pred is: + ['Ogedei'] + label is: + ['Ogedei'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:23,851 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:23,852 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:23,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:23,852 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:23,853 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:24,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:24,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:24,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:24,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:24,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:24,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,283 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4301130771636963 s; generated tokens: 16 tokens; generate speed: 11.187926504198085 tokens/s +2024-07-30 14:23:25,288 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:25,288 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1554/2067], cost time 1.4414s, every example cost time is 1.4414, generate speed: 11.1007 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:11:39 +pred is: + ['Mongol interests in China and satisfying the demands of his Chinese subjects'] + label is: + ['preserving Mongol interests in China and satisfying the demands of his Chinese subjects'] +The F1/Em of this example is: {'F1': 95.83333333333334, 'Em': 0.0} +2024-07-30 14:23:25,372 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:25,373 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 291, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:25,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:25,373 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:25,373 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:26,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,511 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1370973587036133 s; generated tokens: 7 tokens; generate speed: 6.156025204368243 tokens/s +2024-07-30 14:23:26,516 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:26,516 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1555/2067], cost time 1.1485s, every example cost time is 1.1485, generate speed: 6.0949 tokens/s, avg speed: 10.2440 tokens/s, remaining time: 0:11:38 +pred is: + ['Karakorum in Mongolia'] + label is: + ['Karakorum'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:23:26,601 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:26,601 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:26,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:26,602 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:26,602 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:27,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,798 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1952118873596191 s; generated tokens: 9 tokens; generate speed: 7.530045588721669 tokens/s +2024-07-30 14:23:27,802 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:27,803 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1556/2067], cost time 1.2066s, every example cost time is 1.2066, generate speed: 7.4588 tokens/s, avg speed: 10.2424 tokens/s, remaining time: 0:11:37 +pred is: + ['Scientific, commercial, and cultural'] + label is: + ['commercial, scientific, and cultural'] +The F1/Em of this example is: {'F1': 55.55555555555556, 'Em': 0.0} +2024-07-30 14:23:27,914 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:27,914 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 285, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:27,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:27,915 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:27,915 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:28,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:28,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:28,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:28,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:28,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,450 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5350642204284668 s; generated tokens: 20 tokens; generate speed: 13.02877087084839 tokens/s +2024-07-30 14:23:29,455 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:29,455 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1557/2067], cost time 1.5466s, every example cost time is 1.5466, generate speed: 12.9312 tokens/s, avg speed: 10.2444 tokens/s, remaining time: 0:11:35 +pred is: + ['The Song Emperor'] + label is: + ['the Song Emperor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:29,537 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:29,538 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:29,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:29,538 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:29,539 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:30,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:30,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:31,082 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5435514450073242 s; generated tokens: 20 tokens; generate speed: 12.957132115480025 tokens/s +2024-07-30 14:23:31,087 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:31,087 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1558/2067], cost time 1.5550s, every example cost time is 1.5550, generate speed: 12.8614 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:11:34 +pred is: + ['Northern China'] + label is: + ['northern China'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:31,171 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:31,172 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 412, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:31,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:31,172 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:31,173 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:32,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,721 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.547816514968872 s; generated tokens: 20 tokens; generate speed: 12.921428222648352 tokens/s +2024-07-30 14:23:32,725 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:32,726 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1559/2067], cost time 1.5592s, every example cost time is 1.5592, generate speed: 12.8272 tokens/s, avg speed: 10.2482 tokens/s, remaining time: 0:11:33 +pred is: + ['1279'] + label is: + ['after 1279'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:23:32,808 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:32,808 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 282, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:32,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:32,809 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:32,809 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:33,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:33,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:34,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:34,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:34,220 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4108772277832031 s; generated tokens: 16 tokens; generate speed: 11.340462291775381 tokens/s +2024-07-30 14:23:34,225 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:34,225 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1560/2067], cost time 1.4220s, every example cost time is 1.4220, generate speed: 11.2519 tokens/s, avg speed: 10.2489 tokens/s, remaining time: 0:11:31 +pred is: + ['1253'] + label is: + ['1253'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.23240104363272, Em score: 50.51282051282051, current_count: 1560 +2024-07-30 14:23:34,756 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:34,757 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:34,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:34,757 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:34,757 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:35,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,828 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.070408582687378 s; generated tokens: 5 tokens; generate speed: 4.671113517650384 tokens/s +2024-07-30 14:23:35,833 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:35,833 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1561/2067], cost time 1.0818s, every example cost time is 1.0818, generate speed: 4.6219 tokens/s, avg speed: 10.2460 tokens/s, remaining time: 0:11:30 +pred is: + ['Buyantu Khan'] + label is: + ['Buyantu Khan'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:35,915 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:35,915 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:35,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:35,916 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:35,916 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:36,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:36,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:36,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:36,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:36,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,448 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318231582641602 s; generated tokens: 20 tokens; generate speed: 13.056337405594332 tokens/s +2024-07-30 14:23:37,453 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:37,453 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1562/2067], cost time 1.5430s, every example cost time is 1.5430, generate speed: 12.9618 tokens/s, avg speed: 10.2480 tokens/s, remaining time: 0:11:29 +pred is: + ['Emperor Gegeen Khan'] + label is: + ['Gegeen Khan'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:23:37,535 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:37,536 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 357, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:37,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:37,536 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:37,537 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:38,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:38,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:39,043 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5062837600708008 s; generated tokens: 19 tokens; generate speed: 12.613825166054324 tokens/s +2024-07-30 14:23:39,048 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:39,048 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1563/2067], cost time 1.5176s, every example cost time is 1.5176, generate speed: 12.5200 tokens/s, avg speed: 10.2496 tokens/s, remaining time: 0:11:27 +pred is: + ['Shangdu'] + label is: + ['Shangdu'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:39,130 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:39,131 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 220, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:39,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:39,131 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:39,132 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:40,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,664 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318341255187988 s; generated tokens: 20 tokens; generate speed: 13.056243927994773 tokens/s +2024-07-30 14:23:40,668 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:40,669 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1564/2067], cost time 1.5431s, every example cost time is 1.5431, generate speed: 12.9609 tokens/s, avg speed: 10.2516 tokens/s, remaining time: 0:11:26 +pred is: + ['His cultural contribution'] + label is: + ['his cultural contribution'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:40,751 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:40,751 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:40,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:40,752 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:40,752 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:41,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:41,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:42,231 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4783356189727783 s; generated tokens: 18 tokens; generate speed: 12.175854906687091 tokens/s +2024-07-30 14:23:42,236 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:42,236 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1565/2067], cost time 1.4896s, every example cost time is 1.4896, generate speed: 12.0839 tokens/s, avg speed: 10.2528 tokens/s, remaining time: 0:11:25 +pred is: + ['1332'] + label is: + ['1332'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:42,318 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:42,318 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:42,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:42,319 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:42,319 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:43,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,854 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5350828170776367 s; generated tokens: 20 tokens; generate speed: 13.028613034751011 tokens/s +2024-07-30 14:23:43,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:43,859 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1566/2067], cost time 1.5463s, every example cost time is 1.5463, generate speed: 12.9340 tokens/s, avg speed: 10.2548 tokens/s, remaining time: 0:11:23 +pred is: + ['The Yuan dynasty had problems with famine, bitterness among the populace, and struggle.'] + label is: + ['struggle, famine, and bitterness'] +The F1/Em of this example is: {'F1': 21.62162162162162, 'Em': 0.0} +2024-07-30 14:23:43,942 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:43,943 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 315, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:43,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:43,943 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:43,944 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:44,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:44,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:44,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:44,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,265 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.320805311203003 s; generated tokens: 13 tokens; generate speed: 9.842480106443142 tokens/s +2024-07-30 14:23:45,269 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:45,270 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1567/2067], cost time 1.3320s, every example cost time is 1.3320, generate speed: 9.7597 tokens/s, avg speed: 10.2545 tokens/s, remaining time: 0:11:22 +pred is: + ['1340s'] + label is: + ['From the late 1340s onwards'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:23:45,352 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:45,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 260, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:45,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:45,353 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:45,353 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:46,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,887 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5332486629486084 s; generated tokens: 20 tokens; generate speed: 13.044198559115497 tokens/s +2024-07-30 14:23:46,891 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:46,892 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1568/2067], cost time 1.5444s, every example cost time is 1.5444, generate speed: 12.9499 tokens/s, avg speed: 10.2564 tokens/s, remaining time: 0:11:21 +pred is: + ['The political unity of China and much of central Asia promoted trade between East and West.'] + label is: + ['The political unity of China and much of central Asia'] +The F1/Em of this example is: {'F1': 74.50980392156863, 'Em': 0.0} +2024-07-30 14:23:46,976 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:46,976 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:46,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:46,977 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:46,977 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:47,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:47,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:47,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,513 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5357637405395508 s; generated tokens: 20 tokens; generate speed: 13.022836437702011 tokens/s +2024-07-30 14:23:48,518 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:48,518 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1569/2067], cost time 1.5471s, every example cost time is 1.5471, generate speed: 12.9271 tokens/s, avg speed: 10.2583 tokens/s, remaining time: 0:11:19 +pred is: + ['1'] + label is: + ['Western'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:48,600 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:48,600 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:48,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:48,600 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:48,601 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:49,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:49,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:50,138 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5375251770019531 s; generated tokens: 20 tokens; generate speed: 13.00791707294078 tokens/s +2024-07-30 14:23:50,143 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:50,143 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1570/2067], cost time 1.5487s, every example cost time is 1.5487, generate speed: 12.9138 tokens/s, avg speed: 10.2603 tokens/s, remaining time: 0:11:18 +pred is: + ['Marco Polo'] + label is: + ['Marco Polo'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.26348856917849, Em score: 50.50955414012739, current_count: 1570 +2024-07-30 14:23:50,684 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:50,685 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:50,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:50,685 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:50,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:51,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:51,973 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2877826690673828 s; generated tokens: 12 tokens; generate speed: 9.318342518687913 tokens/s +2024-07-30 14:23:51,978 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:51,978 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1571/2067], cost time 1.2993s, every example cost time is 1.2993, generate speed: 9.2355 tokens/s, avg speed: 10.2596 tokens/s, remaining time: 0:11:17 +pred is: + ['Guo Shoujing'] + label is: + ['Guo Shoujing'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:52,060 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:52,060 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 331, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:52,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:52,061 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:52,061 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:53,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,597 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5354111194610596 s; generated tokens: 20 tokens; generate speed: 13.025827250111453 tokens/s +2024-07-30 14:23:53,601 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:53,602 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1572/2067], cost time 1.5465s, every example cost time is 1.5465, generate speed: 12.9322 tokens/s, avg speed: 10.2616 tokens/s, remaining time: 0:11:15 +pred is: + ['1'] + label is: + ['non-native Chinese people'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:53,683 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:53,684 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 408, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:53,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:53,684 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:53,685 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:54,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:54,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:55,221 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5365195274353027 s; generated tokens: 20 tokens; generate speed: 13.016430733804734 tokens/s +2024-07-30 14:23:55,226 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:55,226 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1573/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9224 tokens/s, avg speed: 10.2635 tokens/s, remaining time: 0:11:14 +pred is: + ['Han Chinese, Khitans, Jurchens, Mongols, and Tibetan Buddhists'] + label is: + ['Han Chinese, Khitans, Jurchens, Mongols, and Tibetan Buddhists'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:55,319 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:55,319 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:55,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:55,320 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:55,320 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:56,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,391 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0707831382751465 s; generated tokens: 5 tokens; generate speed: 4.669479581135512 tokens/s +2024-07-30 14:23:56,396 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:56,396 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1574/2067], cost time 1.0824s, every example cost time is 1.0824, generate speed: 4.6192 tokens/s, avg speed: 10.2606 tokens/s, remaining time: 0:11:13 +pred is: + ['Mongols'] + label is: + ['the Privy Council'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:23:56,479 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:56,479 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:56,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:56,480 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:56,480 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:57,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:57,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:58,019 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5384116172790527 s; generated tokens: 20 tokens; generate speed: 13.000421847680443 tokens/s +2024-07-30 14:23:58,023 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:58,024 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1575/2067], cost time 1.5500s, every example cost time is 1.5500, generate speed: 12.9035 tokens/s, avg speed: 10.2625 tokens/s, remaining time: 0:11:11 +pred is: + ['1269'] + label is: + ['1269'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:58,106 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:58,106 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:58,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:58,107 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:58,107 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:23:59,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,333 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2260591983795166 s; generated tokens: 10 tokens; generate speed: 8.156213022354066 tokens/s +2024-07-30 14:23:59,338 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:23:59,338 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1576/2067], cost time 1.2372s, every example cost time is 1.2372, generate speed: 8.0825 tokens/s, avg speed: 10.2613 tokens/s, remaining time: 0:11:10 +pred is: + ['1290'] + label is: + ['1290'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:23:59,421 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:23:59,421 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 439, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:23:59,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:23:59,422 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:23:59,422 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:00,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:00,962 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5395777225494385 s; generated tokens: 20 tokens; generate speed: 12.990575082420216 tokens/s +2024-07-30 14:24:00,967 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:00,967 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1577/2067], cost time 1.5510s, every example cost time is 1.5510, generate speed: 12.8952 tokens/s, avg speed: 10.2632 tokens/s, remaining time: 0:11:09 +pred is: + ['Painting, poetry, and calligraphy'] + label is: + ['painting, mathematics, calligraphy, poetry, and theater'] +The F1/Em of this example is: {'F1': 58.333333333333336, 'Em': 0.0} +2024-07-30 14:24:01,050 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:01,051 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 343, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:01,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:01,051 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:01,052 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:01,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,588 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5360848903656006 s; generated tokens: 20 tokens; generate speed: 13.020113748557112 tokens/s +2024-07-30 14:24:02,593 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:02,593 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1578/2067], cost time 1.5474s, every example cost time is 1.5474, generate speed: 12.9247 tokens/s, avg speed: 10.2651 tokens/s, remaining time: 0:11:07 +pred is: + ['The western khanates'] + label is: + ['western'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:24:02,675 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:02,676 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:02,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:02,676 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:02,677 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:03,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,869 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:03,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:04,209 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5323386192321777 s; generated tokens: 20 tokens; generate speed: 13.051945404875049 tokens/s +2024-07-30 14:24:04,214 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:04,214 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1579/2067], cost time 1.5436s, every example cost time is 1.5436, generate speed: 12.9571 tokens/s, avg speed: 10.2670 tokens/s, remaining time: 0:11:06 +pred is: + ['1249'] + label is: + ['1249'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:04,297 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:04,297 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:04,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:04,298 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:04,298 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:05,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:05,831 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5333373546600342 s; generated tokens: 20 tokens; generate speed: 13.04344405307619 tokens/s +2024-07-30 14:24:05,836 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:05,836 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1580/2067], cost time 1.5446s, every example cost time is 1.5446, generate speed: 12.9481 tokens/s, avg speed: 10.2689 tokens/s, remaining time: 0:11:05 +pred is: + ['1'] + label is: + ['applied mathematics to the construction of calendars'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 64.23123020270691, Em score: 50.50632911392405, current_count: 1580 +2024-07-30 14:24:06,376 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:06,377 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:06,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:06,377 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:06,378 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:07,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,907 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5289194583892822 s; generated tokens: 20 tokens; generate speed: 13.081133796982357 tokens/s +2024-07-30 14:24:07,911 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:07,912 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1581/2067], cost time 1.5407s, every example cost time is 1.5407, generate speed: 12.9814 tokens/s, avg speed: 10.2709 tokens/s, remaining time: 0:11:03 +pred is: + ['Non-Mongol physicians'] + label is: + ['non-Mongol physicians'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:07,995 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:07,995 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:07,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:07,996 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:07,996 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:08,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:08,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,229 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2334418296813965 s; generated tokens: 10 tokens; generate speed: 8.107394900481886 tokens/s +2024-07-30 14:24:09,234 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:09,234 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1582/2067], cost time 1.2447s, every example cost time is 1.2447, generate speed: 8.0340 tokens/s, avg speed: 10.2696 tokens/s, remaining time: 0:11:02 +pred is: + ['4'] + label is: + ['four'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:24:09,316 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:09,317 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:09,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:09,317 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:09,318 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:10,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,574 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2561235427856445 s; generated tokens: 11 tokens; generate speed: 8.757100416735945 tokens/s +2024-07-30 14:24:10,579 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:10,579 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1583/2067], cost time 1.2674s, every example cost time is 1.2674, generate speed: 8.6793 tokens/s, avg speed: 10.2687 tokens/s, remaining time: 0:11:00 +pred is: + ['Muslim medicine'] + label is: + ['Muslim medicine'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:10,662 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:10,662 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:10,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:10,663 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:10,663 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:11,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:11,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:12,193 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297739505767822 s; generated tokens: 20 tokens; generate speed: 13.073827013761901 tokens/s +2024-07-30 14:24:12,198 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:12,198 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1584/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9791 tokens/s, avg speed: 10.2706 tokens/s, remaining time: 0:10:59 +pred is: + ['Through Kingdom of Qocho and Tibetan intermediaries'] + label is: + ['through Kingdom of Qocho and Tibetan intermediaries'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:12,283 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:12,283 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:12,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:12,284 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:12,284 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:13,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,760 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4759056568145752 s; generated tokens: 18 tokens; generate speed: 12.19590149064753 tokens/s +2024-07-30 14:24:13,765 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:13,765 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1585/2067], cost time 1.4871s, every example cost time is 1.4871, generate speed: 12.1037 tokens/s, avg speed: 10.2718 tokens/s, remaining time: 0:10:58 +pred is: + ['chao'] + label is: + ['chao'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:13,848 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:13,848 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 360, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:13,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:13,849 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:13,849 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:14,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:14,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:15,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:15,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:15,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:15,409 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5599639415740967 s; generated tokens: 20 tokens; generate speed: 12.820809165511099 tokens/s +2024-07-30 14:24:15,414 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:15,415 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1586/2067], cost time 1.5715s, every example cost time is 1.5715, generate speed: 12.7266 tokens/s, avg speed: 10.2736 tokens/s, remaining time: 0:10:57 +pred is: + ['Mongolian patrimonial feudalism'] + label is: + ['patrimonial feudalism'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:24:15,499 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:15,499 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:15,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:15,500 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:15,500 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:16,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:16,988 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.487522840499878 s; generated tokens: 18 tokens; generate speed: 12.100654531093554 tokens/s +2024-07-30 14:24:16,993 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:16,993 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1587/2067], cost time 1.4997s, every example cost time is 1.4997, generate speed: 12.0028 tokens/s, avg speed: 10.2748 tokens/s, remaining time: 0:10:55 +pred is: + ['Muslims'] + label is: + ['Central Asian Muslims'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:24:17,076 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:17,077 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 274, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:17,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:17,077 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:17,078 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:18,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,624 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5460467338562012 s; generated tokens: 20 tokens; generate speed: 12.936219560527343 tokens/s +2024-07-30 14:24:18,629 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:18,629 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1588/2067], cost time 1.5580s, every example cost time is 1.5580, generate speed: 12.8372 tokens/s, avg speed: 10.2767 tokens/s, remaining time: 0:10:54 +pred is: + ['Forcing them to eat food the Mongol way'] + label is: + ['restricting Halal slaughter and other Islamic practices like circumcision'] +The F1/Em of this example is: {'F1': 6.25, 'Em': 0.0} +2024-07-30 14:24:18,713 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:18,713 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:18,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:18,714 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:18,714 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:19,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:19,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:20,275 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5606656074523926 s; generated tokens: 20 tokens; generate speed: 12.815045006756895 tokens/s +2024-07-30 14:24:20,280 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:20,280 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1589/2067], cost time 1.5727s, every example cost time is 1.5727, generate speed: 12.7169 tokens/s, avg speed: 10.2784 tokens/s, remaining time: 0:10:53 +pred is: + ['Frederick W. Mote'] + label is: + ['Frederick W. Mote'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:20,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:20,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:20,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:20,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:20,365 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:21,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:21,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:21,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:21,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:21,408 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0421006679534912 s; generated tokens: 4 tokens; generate speed: 3.8384007639639277 tokens/s +2024-07-30 14:24:21,412 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:21,413 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1590/2067], cost time 1.0540s, every example cost time is 1.0540, generate speed: 3.7949 tokens/s, avg speed: 10.2753 tokens/s, remaining time: 0:10:51 +pred is: + ['Northern China'] + label is: + ['Northern'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 64.24523714063538, Em score: 50.503144654088054, current_count: 1590 +2024-07-30 14:24:21,957 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:21,958 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:21,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:21,958 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:21,958 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:22,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:22,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:22,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:22,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:23,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:23,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:23,066 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1069777011871338 s; generated tokens: 6 tokens; generate speed: 5.420163381399228 tokens/s +2024-07-30 14:24:23,070 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:23,071 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1591/2067], cost time 1.1187s, every example cost time is 1.1187, generate speed: 5.3632 tokens/s, avg speed: 10.2728 tokens/s, remaining time: 0:10:50 +pred is: + ['The Uighurs'] + label is: + ['Uighurs'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:24:23,153 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:23,154 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:23,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:23,154 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:23,154 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:24,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,703 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5485551357269287 s; generated tokens: 20 tokens; generate speed: 12.915265035501317 tokens/s +2024-07-30 14:24:24,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:24,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1592/2067], cost time 1.5601s, every example cost time is 1.5601, generate speed: 12.8201 tokens/s, avg speed: 10.2746 tokens/s, remaining time: 0:10:48 +pred is: + ['Central Region'] + label is: + ['The Central Region'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:24:24,791 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:24,791 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:24,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:24,792 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:24,792 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:25,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:25,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:26,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:26,150 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3570382595062256 s; generated tokens: 14 tokens; generate speed: 10.316584592901652 tokens/s +2024-07-30 14:24:26,154 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:26,155 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1593/2067], cost time 1.3684s, every example cost time is 1.3684, generate speed: 10.2309 tokens/s, avg speed: 10.2746 tokens/s, remaining time: 0:10:47 +pred is: + ['Africa'] + label is: + ['in Africa'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:24:26,236 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:26,237 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:26,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:26,237 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:26,237 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:27,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:27,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:27,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:27,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:27,289 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0512464046478271 s; generated tokens: 4 tokens; generate speed: 3.80500706810029 tokens/s +2024-07-30 14:24:27,294 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:27,294 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1594/2067], cost time 1.0626s, every example cost time is 1.0626, generate speed: 3.7643 tokens/s, avg speed: 10.2714 tokens/s, remaining time: 0:10:46 +pred is: + ['Tropical'] + label is: + ['a warm and humid tropical climate on its Indian Ocean coastline'] +The F1/Em of this example is: {'F1': 9.09090909090909, 'Em': 0.0} +2024-07-30 14:24:27,378 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:27,378 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:27,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:27,379 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:27,379 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:28,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,579 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,706 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3271706104278564 s; generated tokens: 13 tokens; generate speed: 9.79527417037138 tokens/s +2024-07-30 14:24:28,711 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:28,711 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1595/2067], cost time 1.3389s, every example cost time is 1.3389, generate speed: 9.7098 tokens/s, avg speed: 10.2710 tokens/s, remaining time: 0:10:44 +pred is: + ['Since the Lower Paleolithic period'] + label is: + ['Lower Paleolithic period'] +The F1/Em of this example is: {'F1': 71.42857142857143, 'Em': 0.0} +2024-07-30 14:24:28,794 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:28,794 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:28,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:28,795 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:28,795 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:29,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,897 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:29,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:30,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:30,281 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4853625297546387 s; generated tokens: 18 tokens; generate speed: 12.118253718823343 tokens/s +2024-07-30 14:24:30,286 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:30,286 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1596/2067], cost time 1.4971s, every example cost time is 1.4971, generate speed: 12.0230 tokens/s, avg speed: 10.2722 tokens/s, remaining time: 0:10:43 +pred is: + ['Mount Kenya'] + label is: + ['Mount Kenya'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:30,369 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:30,369 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:30,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:30,370 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:30,370 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:31,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:31,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:31,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:31,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:31,413 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.042569637298584 s; generated tokens: 4 tokens; generate speed: 3.836674172062456 tokens/s +2024-07-30 14:24:31,418 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:31,418 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1597/2067], cost time 1.0539s, every example cost time is 1.0539, generate speed: 3.7953 tokens/s, avg speed: 10.2691 tokens/s, remaining time: 0:10:41 +pred is: + ['Kenia'] + label is: + ['both Kenia and Kegnia'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:24:31,501 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:31,501 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:31,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:31,501 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:31,502 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:32,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:32,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:33,036 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5343735218048096 s; generated tokens: 20 tokens; generate speed: 13.034635775306501 tokens/s +2024-07-30 14:24:33,052 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:33,052 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1598/2067], cost time 1.5562s, every example cost time is 1.5562, generate speed: 12.8516 tokens/s, avg speed: 10.2709 tokens/s, remaining time: 0:10:40 +pred is: + ['The "Big Five" game animals of Kenya, that is the lion, leopard, buffalo,'] + label is: + ['The "Big Five"'] +The F1/Em of this example is: {'F1': 36.84210526315789, 'Em': 0.0} +2024-07-30 14:24:33,135 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:33,136 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:33,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:33,136 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:33,137 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:34,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,241 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1043977737426758 s; generated tokens: 6 tokens; generate speed: 5.432825149281764 tokens/s +2024-07-30 14:24:34,256 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:34,256 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1599/2067], cost time 1.1260s, every example cost time is 1.1260, generate speed: 5.3288 tokens/s, avg speed: 10.2684 tokens/s, remaining time: 0:10:39 +pred is: + ['20 million years ago'] + label is: + ['more than 20 million years ago'] +The F1/Em of this example is: {'F1': 77.77777777777779, 'Em': 0.0} +2024-07-30 14:24:34,339 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:34,340 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:34,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:34,340 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:34,340 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:35,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,412 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0716078281402588 s; generated tokens: 5 tokens; generate speed: 4.665886034704823 tokens/s +2024-07-30 14:24:35,417 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:35,417 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1600/2067], cost time 1.0829s, every example cost time is 1.0829, generate speed: 4.6172 tokens/s, avg speed: 10.2656 tokens/s, remaining time: 0:10:37 +pred is: + ['Swahili'] + label is: + ['The Swahili'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 64.18441651073168, Em score: 50.25, current_count: 1600 +2024-07-30 14:24:35,976 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:35,976 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:35,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:35,977 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:35,977 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:36,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:36,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:36,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:37,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:37,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:37,059 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0811614990234375 s; generated tokens: 5 tokens; generate speed: 4.62465598758027 tokens/s +2024-07-30 14:24:37,064 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:37,064 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1601/2067], cost time 1.1015s, every example cost time is 1.1015, generate speed: 4.5392 tokens/s, avg speed: 10.2627 tokens/s, remaining time: 0:10:36 +pred is: + ['Kenyan Coast'] + label is: + ['the Kenyan Coast'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:24:37,161 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:37,162 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:37,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:37,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:37,163 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:38,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,706 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5436031818389893 s; generated tokens: 20 tokens; generate speed: 12.95669783225814 tokens/s +2024-07-30 14:24:38,711 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:38,711 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1602/2067], cost time 1.5628s, every example cost time is 1.5628, generate speed: 12.7971 tokens/s, avg speed: 10.2645 tokens/s, remaining time: 0:10:34 +pred is: + ['August 1914'] + label is: + ['August 1914'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:38,794 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:38,795 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:38,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:38,795 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:38,795 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:39,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:39,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:40,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:40,344 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5483639240264893 s; generated tokens: 20 tokens; generate speed: 12.91685997694289 tokens/s +2024-07-30 14:24:40,349 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:40,349 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1603/2067], cost time 1.5599s, every example cost time is 1.5599, generate speed: 12.8212 tokens/s, avg speed: 10.2663 tokens/s, remaining time: 0:10:33 +pred is: + ['Central highlands'] + label is: + ['The central highlands'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:24:40,433 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:40,433 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:40,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:40,434 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:40,434 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:41,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,813 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3781404495239258 s; generated tokens: 14 tokens; generate speed: 10.158616275167205 tokens/s +2024-07-30 14:24:41,817 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:41,818 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1604/2067], cost time 1.3899s, every example cost time is 1.3899, generate speed: 10.0726 tokens/s, avg speed: 10.2662 tokens/s, remaining time: 0:10:32 +pred is: + ['15 January 1954'] + label is: + ['15 January 1954'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:41,902 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:41,902 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:41,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:41,903 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:41,903 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:42,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:42,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:42,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:42,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:42,949 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0459752082824707 s; generated tokens: 4 tokens; generate speed: 3.824182416874053 tokens/s +2024-07-30 14:24:42,954 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:42,954 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1605/2067], cost time 1.0577s, every example cost time is 1.0577, generate speed: 3.7818 tokens/s, avg speed: 10.2631 tokens/s, remaining time: 0:10:30 +pred is: + ['1957'] + label is: + ['1957'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:43,036 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:43,036 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:43,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:43,037 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:43,037 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:43,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,610 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5734989643096924 s; generated tokens: 20 tokens; generate speed: 12.710526319776875 tokens/s +2024-07-30 14:24:44,615 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:44,616 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1606/2067], cost time 1.5848s, every example cost time is 1.5848, generate speed: 12.6202 tokens/s, avg speed: 10.2648 tokens/s, remaining time: 0:10:29 +pred is: + ['A system where voters line up behind their favoured candidates instead of a secret ballot'] + label is: + ['where voters were supposed to line up behind their favoured candidates instead of a secret ballot'] +The F1/Em of this example is: {'F1': 73.33333333333333, 'Em': 0.0} +2024-07-30 14:24:44,701 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:44,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:44,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:44,702 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:44,702 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:45,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,856 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:45,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:46,264 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5610039234161377 s; generated tokens: 20 tokens; generate speed: 12.812267605472464 tokens/s +2024-07-30 14:24:46,268 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:46,269 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1607/2067], cost time 1.5725s, every example cost time is 1.5725, generate speed: 12.7188 tokens/s, avg speed: 10.2666 tokens/s, remaining time: 0:10:28 +pred is: + ['Presidential representative democratic republic'] + label is: + ['a presidential representative democratic republic'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:24:46,352 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:46,352 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:46,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:46,353 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:46,353 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:47,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,890 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5362548828125 s; generated tokens: 20 tokens; generate speed: 13.018673023440604 tokens/s +2024-07-30 14:24:47,894 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:47,895 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1608/2067], cost time 1.5478s, every example cost time is 1.5478, generate speed: 12.9212 tokens/s, avg speed: 10.2684 tokens/s, remaining time: 0:10:26 +pred is: + ['27/100'] + label is: + ['low'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:24:47,978 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:47,978 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:47,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:47,979 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:47,979 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:48,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:48,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:48,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,524 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5439832210540771 s; generated tokens: 20 tokens; generate speed: 12.953508643925549 tokens/s +2024-07-30 14:24:49,528 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:49,529 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1609/2067], cost time 1.5555s, every example cost time is 1.5555, generate speed: 12.8575 tokens/s, avg speed: 10.2703 tokens/s, remaining time: 0:10:25 +pred is: + ['Party of National Unity'] + label is: + ['Party of National Unity'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:49,612 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:49,612 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:49,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:49,613 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:49,613 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:50,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:50,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:51,175 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5616803169250488 s; generated tokens: 20 tokens; generate speed: 12.806718368186925 tokens/s +2024-07-30 14:24:51,179 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:51,180 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1610/2067], cost time 1.5729s, every example cost time is 1.5729, generate speed: 12.7150 tokens/s, avg speed: 10.2720 tokens/s, remaining time: 0:10:24 +pred is: + ['Programmes to avoid similar disasters in the future'] + label is: + ['programmes to avoid similar disasters in the future'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.28937872702113, Em score: 50.24844720496895, current_count: 1610 +2024-07-30 14:24:51,775 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:51,775 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:51,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:51,776 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:51,776 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:52,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:52,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:53,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:53,259 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4827218055725098 s; generated tokens: 18 tokens; generate speed: 12.139836301287701 tokens/s +2024-07-30 14:24:53,264 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:53,264 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1611/2067], cost time 1.4947s, every example cost time is 1.4947, generate speed: 12.0427 tokens/s, avg speed: 10.2732 tokens/s, remaining time: 0:10:22 +pred is: + ['28 February 2008'] + label is: + ['28 February 2008'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:53,349 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:53,349 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:53,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:53,350 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:53,350 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:54,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,901 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5510144233703613 s; generated tokens: 20 tokens; generate speed: 12.894786598141305 tokens/s +2024-07-30 14:24:54,906 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:54,906 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1612/2067], cost time 1.5630s, every example cost time is 1.5630, generate speed: 12.7959 tokens/s, avg speed: 10.2750 tokens/s, remaining time: 0:10:21 +pred is: + ['The new office of the PM will have power and authority to co-ordinate and supervise the functions'] + label is: + ['PM will have power and authority to co-ordinate and supervise the functions of the Government'] +The F1/Em of this example is: {'F1': 74.19354838709677, 'Em': 0.0} +2024-07-30 14:24:54,991 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:54,991 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:54,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:54,992 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:54,992 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:55,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:55,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,096 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,540 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5481698513031006 s; generated tokens: 20 tokens; generate speed: 12.91847918570816 tokens/s +2024-07-30 14:24:56,545 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:56,546 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1613/2067], cost time 1.5597s, every example cost time is 1.5597, generate speed: 12.8233 tokens/s, avg speed: 10.2768 tokens/s, remaining time: 0:10:20 +pred is: + ['The position of Prime Minister was eliminated and the powers of the President were reduced.'] + label is: + ['eliminate the position of Prime Minister and simultaneously reduce the powers of the President'] +The F1/Em of this example is: {'F1': 35.08771929824561, 'Em': 0.0} +2024-07-30 14:24:56,630 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:56,631 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:56,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:56,631 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:56,632 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:57,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:57,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:58,168 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536329746246338 s; generated tokens: 20 tokens; generate speed: 13.018038639729081 tokens/s +2024-07-30 14:24:58,173 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:58,173 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1614/2067], cost time 1.5479s, every example cost time is 1.5479, generate speed: 12.9208 tokens/s, avg speed: 10.2787 tokens/s, remaining time: 0:10:19 +pred is: + ['December 2014'] + label is: + ['December 2014'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:24:58,256 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:58,256 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 154, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:58,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:58,257 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:58,257 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:24:59,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,848 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5908386707305908 s; generated tokens: 20 tokens; generate speed: 12.571985059185808 tokens/s +2024-07-30 14:24:59,853 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:24:59,853 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1615/2067], cost time 1.6022s, every example cost time is 1.6022, generate speed: 12.4832 tokens/s, avg speed: 10.2803 tokens/s, remaining time: 0:10:17 +pred is: + ['The result of the 2007 election was that President Mwai Kibaki was declared'] + label is: + ['h International Criminal Court trial dates in 2013 for both President Kenyatta and Deputy President William Ruto'] +The F1/Em of this example is: {'F1': 10.344827586206897, 'Em': 0.0} +2024-07-30 14:24:59,937 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:24:59,938 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:24:59,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:24:59,938 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:24:59,939 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:00,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:00,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:00,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:00,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,481 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5420358180999756 s; generated tokens: 20 tokens; generate speed: 12.969867343706104 tokens/s +2024-07-30 14:25:01,486 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:01,486 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1616/2067], cost time 1.5537s, every example cost time is 1.5537, generate speed: 12.8721 tokens/s, avg speed: 10.2821 tokens/s, remaining time: 0:10:16 +pred is: + ['Peacekeeping missions'] + label is: + ['in peacekeeping missions around the world'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 14:25:01,568 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:01,569 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:01,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:01,569 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:01,569 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:02,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:02,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:02,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:02,610 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:02,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0437467098236084 s; generated tokens: 4 tokens; generate speed: 3.832347409915183 tokens/s +2024-07-30 14:25:02,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:02,619 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1617/2067], cost time 1.0551s, every example cost time is 1.0551, generate speed: 3.7913 tokens/s, avg speed: 10.2790 tokens/s, remaining time: 0:10:14 +pred is: + ['The police'] + label is: + ['Kenya’s armed forces'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:25:02,703 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:02,704 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:02,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:02,704 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:02,705 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:03,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,782 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0767781734466553 s; generated tokens: 5 tokens; generate speed: 4.643481938341598 tokens/s +2024-07-30 14:25:03,786 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:03,787 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1618/2067], cost time 1.0886s, every example cost time is 1.0886, generate speed: 4.5930 tokens/s, avg speed: 10.2762 tokens/s, remaining time: 0:10:13 +pred is: + ['0.519'] + label is: + ['0.519, ranked 145 out of 186 in the world'] +The F1/Em of this example is: {'F1': 10.526315789473683, 'Em': 0.0} +2024-07-30 14:25:03,870 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:03,871 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:03,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:03,872 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:03,872 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:04,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:04,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:04,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:04,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:04,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:04,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,331 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.459507942199707 s; generated tokens: 17 tokens; generate speed: 11.647761213534979 tokens/s +2024-07-30 14:25:05,336 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:05,337 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1619/2067], cost time 1.4716s, every example cost time is 1.4716, generate speed: 11.5519 tokens/s, avg speed: 10.2770 tokens/s, remaining time: 0:10:12 +pred is: + ['rapid expansion in telecommunication and financial activity'] + label is: + ['rapid expansion in telecommunication and financial activity'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:05,420 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:05,421 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:05,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:05,421 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:05,421 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:06,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:06,627 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2053420543670654 s; generated tokens: 9 tokens; generate speed: 7.466760134512995 tokens/s +2024-07-30 14:25:06,632 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:06,632 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1620/2067], cost time 1.2171s, every example cost time is 1.2171, generate speed: 7.3949 tokens/s, avg speed: 10.2754 tokens/s, remaining time: 0:10:10 +pred is: + ['61%'] + label is: + ['61%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.26167241013715, Em score: 50.18518518518518, current_count: 1620 +2024-07-30 14:25:07,219 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:07,219 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:07,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:07,220 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:07,220 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:08,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,460 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.239623785018921 s; generated tokens: 10 tokens; generate speed: 8.066963639171675 tokens/s +2024-07-30 14:25:08,465 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:08,465 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1621/2067], cost time 1.2515s, every example cost time is 1.2515, generate speed: 7.9905 tokens/s, avg speed: 10.2742 tokens/s, remaining time: 0:10:09 +pred is: + ['24'] + label is: + ['24%'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:08,548 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:08,549 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:08,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:08,549 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:08,550 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:09,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:09,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:10,126 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5765531063079834 s; generated tokens: 20 tokens; generate speed: 12.685903138928548 tokens/s +2024-07-30 14:25:10,131 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:10,132 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1622/2067], cost time 1.5884s, every example cost time is 1.5884, generate speed: 12.5911 tokens/s, avg speed: 10.2758 tokens/s, remaining time: 0:10:08 +pred is: + ['ICRISAT'] + label is: + ['International Crops Research Institute for the Semi-Arid Tropics (ICRISAT)'] +The F1/Em of this example is: {'F1': 10.0, 'Em': 0.0} +2024-07-30 14:25:10,215 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:10,216 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:10,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:10,216 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:10,217 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:11,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,774 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5571112632751465 s; generated tokens: 20 tokens; generate speed: 12.84429730341366 tokens/s +2024-07-30 14:25:11,779 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:11,779 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1623/2067], cost time 1.5687s, every example cost time is 1.5687, generate speed: 12.7492 tokens/s, avg speed: 10.2776 tokens/s, remaining time: 0:10:06 +pred is: + ['1'] + label is: + ['the fertile highlands'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:11,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:11,863 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:11,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:11,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:11,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:12,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:12,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:12,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:12,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:12,908 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0436673164367676 s; generated tokens: 4 tokens; generate speed: 3.832638942509557 tokens/s +2024-07-30 14:25:12,913 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:12,913 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1624/2067], cost time 1.0553s, every example cost time is 1.0553, generate speed: 3.7903 tokens/s, avg speed: 10.2745 tokens/s, remaining time: 0:10:05 +pred is: + ['Kenya'] + label is: + ['Kenya'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:12,996 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:12,996 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:12,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:12,997 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:12,997 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:13,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:13,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,549 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5523340702056885 s; generated tokens: 20 tokens; generate speed: 12.883824676572322 tokens/s +2024-07-30 14:25:14,554 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:14,555 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1625/2067], cost time 1.5641s, every example cost time is 1.5641, generate speed: 12.7872 tokens/s, avg speed: 10.2763 tokens/s, remaining time: 0:10:03 +pred is: + ["Kenya's inclusion among the beneficiaries of the US Government's African Growth and Opportunity Act (AGOA)"] + label is: + ["Kenya's inclusion among the beneficiaries of the US Government's African Growth and Opportunity Act (AGOA)"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:14,640 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:14,640 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:14,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:14,641 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:14,641 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:15,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:15,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:16,016 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.375159740447998 s; generated tokens: 14 tokens; generate speed: 10.180635447805573 tokens/s +2024-07-30 14:25:16,021 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:16,022 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1626/2067], cost time 1.3870s, every example cost time is 1.3870, generate speed: 10.0939 tokens/s, avg speed: 10.2761 tokens/s, remaining time: 0:10:02 +pred is: + ['Hydroelectric stations'] + label is: + ['hydroelectric stations at dams'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:25:16,106 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:16,106 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:16,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:16,107 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:16,107 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:17,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,660 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5532469749450684 s; generated tokens: 20 tokens; generate speed: 12.876252342746275 tokens/s +2024-07-30 14:25:17,665 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:17,666 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1627/2067], cost time 1.5654s, every example cost time is 1.5654, generate speed: 12.7765 tokens/s, avg speed: 10.2779 tokens/s, remaining time: 0:10:01 +pred is: + ['Turkana'] + label is: + ['in Turkana'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:25:17,749 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:17,750 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 284, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:17,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:17,750 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:17,751 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:18,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:18,991 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2396893501281738 s; generated tokens: 10 tokens; generate speed: 8.06653699087282 tokens/s +2024-07-30 14:25:18,995 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:18,996 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1628/2067], cost time 1.2516s, every example cost time is 1.2516, generate speed: 7.9901 tokens/s, avg speed: 10.2766 tokens/s, remaining time: 0:09:59 +pred is: + ['474'] + label is: + ['$474 million'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:25:19,079 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:19,079 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:19,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:19,080 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:19,080 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:20,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,541 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4611847400665283 s; generated tokens: 17 tokens; generate speed: 11.634394703044862 tokens/s +2024-07-30 14:25:20,546 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:20,547 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1629/2067], cost time 1.4729s, every example cost time is 1.4729, generate speed: 11.5420 tokens/s, avg speed: 10.2774 tokens/s, remaining time: 0:09:58 +pred is: + ['Kenya reveiled Vision 2030'] + label is: + ['Vision 2030'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:25:20,630 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:20,631 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:20,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:20,631 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:20,632 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:21,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:21,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:21,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:21,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:21,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:21,709 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0773708820343018 s; generated tokens: 5 tokens; generate speed: 4.640927356936688 tokens/s +2024-07-30 14:25:21,714 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:21,714 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1630/2067], cost time 1.0890s, every example cost time is 1.0890, generate speed: 4.5914 tokens/s, avg speed: 10.2747 tokens/s, remaining time: 0:09:57 +pred is: + ['Agriculture'] + label is: + ['in agriculture'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 64.1557725794001, Em score: 50.0, current_count: 1630 +2024-07-30 14:25:22,288 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:22,289 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:22,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:22,289 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:22,290 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:23,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:23,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:23,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:23,302 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.012751579284668 s; generated tokens: 3 tokens; generate speed: 2.9622269284625315 tokens/s +2024-07-30 14:25:23,307 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:23,308 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1631/2067], cost time 1.0245s, every example cost time is 1.0245, generate speed: 2.9282 tokens/s, avg speed: 10.2713 tokens/s, remaining time: 0:09:55 +pred is: + ['English'] + label is: + ["Kenya's various ethnic groups typically speak their mother tongues within their own communities"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:23,391 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:23,392 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:23,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:23,392 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:23,393 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:24,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:24,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:24,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:24,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:24,439 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0459890365600586 s; generated tokens: 4 tokens; generate speed: 3.824131860076459 tokens/s +2024-07-30 14:25:24,444 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:24,444 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1632/2067], cost time 1.0580s, every example cost time is 1.0580, generate speed: 3.7807 tokens/s, avg speed: 10.2682 tokens/s, remaining time: 0:09:54 +pred is: + ['Christianity'] + label is: + ['Christian'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:24,527 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:24,527 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:24,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:24,528 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:24,528 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:25,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,635 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1066365242004395 s; generated tokens: 6 tokens; generate speed: 5.421834422404488 tokens/s +2024-07-30 14:25:25,640 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:25,640 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1633/2067], cost time 1.1185s, every example cost time is 1.1185, generate speed: 5.3643 tokens/s, avg speed: 10.2658 tokens/s, remaining time: 0:09:52 +pred is: + ['2.4%'] + label is: + ['2.4%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:25,722 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:25,722 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:25,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:25,723 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:25,723 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:26,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:26,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:26,703 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9793753623962402 s; generated tokens: 2 tokens; generate speed: 2.0421179425083706 tokens/s +2024-07-30 14:25:26,708 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:26,708 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1634/2067], cost time 0.9909s, every example cost time is 0.9909, generate speed: 2.0183 tokens/s, avg speed: 10.2621 tokens/s, remaining time: 0:09:51 +pred is: + ['Nurses'] + label is: + ['Nurses'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:26,797 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:26,797 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:26,797 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:26,798 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:26,798 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:27,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,872 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:27,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:28,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:28,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:28,356 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5584731101989746 s; generated tokens: 20 tokens; generate speed: 12.833073518635521 tokens/s +2024-07-30 14:25:28,361 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:28,362 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1635/2067], cost time 1.5702s, every example cost time is 1.5702, generate speed: 12.7369 tokens/s, avg speed: 10.2638 tokens/s, remaining time: 0:09:50 +pred is: + ['1'] + label is: + ['Diseases of poverty'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:28,444 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:28,445 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:28,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:28,445 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:28,446 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:29,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,560 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,593 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,725 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2788560390472412 s; generated tokens: 11 tokens; generate speed: 8.601437272169505 tokens/s +2024-07-30 14:25:29,730 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:29,730 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1636/2067], cost time 1.2906s, every example cost time is 1.2906, generate speed: 8.5234 tokens/s, avg speed: 10.2628 tokens/s, remaining time: 0:09:48 +pred is: + ['British colonists'] + label is: + ['British colonists.'] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:25:29,813 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:29,813 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:29,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:29,814 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:29,814 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:30,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:30,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:31,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:31,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:31,380 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5662591457366943 s; generated tokens: 20 tokens; generate speed: 12.76927898837133 tokens/s +2024-07-30 14:25:31,385 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:31,386 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1637/2067], cost time 1.5780s, every example cost time is 1.5780, generate speed: 12.6746 tokens/s, avg speed: 10.2645 tokens/s, remaining time: 0:09:47 +pred is: + ['1'] + label is: + ['look at both the possibilities of setting up a second university in Kenya as well as the reforming of the entire education system'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:31,470 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:31,471 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:31,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:31,472 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:31,472 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:32,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,745 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.272994041442871 s; generated tokens: 11 tokens; generate speed: 8.64104594514212 tokens/s +2024-07-30 14:25:32,750 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:32,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1638/2067], cost time 1.2850s, every example cost time is 1.2850, generate speed: 8.5602 tokens/s, avg speed: 10.2635 tokens/s, remaining time: 0:09:45 +pred is: + ['1985'] + label is: + ['January 1985'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:25:32,833 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:32,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:32,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:32,834 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:32,834 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:33,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:33,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:34,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:34,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:34,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:34,394 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5596003532409668 s; generated tokens: 20 tokens; generate speed: 12.823798070087953 tokens/s +2024-07-30 14:25:34,399 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:34,399 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1639/2067], cost time 1.5714s, every example cost time is 1.5714, generate speed: 12.7274 tokens/s, avg speed: 10.2653 tokens/s, remaining time: 0:09:44 +pred is: + ['6'] + label is: + ['age six years'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:34,482 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:34,482 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 223, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:34,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:34,483 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:34,483 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:35,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:35,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:35,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:35,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:35,530 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0464892387390137 s; generated tokens: 4 tokens; generate speed: 3.822303996952585 tokens/s +2024-07-30 14:25:35,535 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:35,535 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1640/2067], cost time 1.0581s, every example cost time is 1.0581, generate speed: 3.7802 tokens/s, avg speed: 10.2622 tokens/s, remaining time: 0:09:43 +pred is: + ['85%'] + label is: + ['85%'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 64.03025828666856, Em score: 49.8780487804878, current_count: 1640 +2024-07-30 14:25:36,108 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:36,109 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:36,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:36,109 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:36,110 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:37,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,439 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3289341926574707 s; generated tokens: 13 tokens; generate speed: 9.782275203562858 tokens/s +2024-07-30 14:25:37,444 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:37,444 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1641/2067], cost time 1.3409s, every example cost time is 1.3409, generate speed: 9.6951 tokens/s, avg speed: 10.2619 tokens/s, remaining time: 0:09:41 +pred is: + ['Kenya National Library Service (KNLS)'] + label is: + ['the Kenya National Library Service'] +The F1/Em of this example is: {'F1': 70.0, 'Em': 0.0} +2024-07-30 14:25:37,527 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:37,527 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:37,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:37,528 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:37,528 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:38,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,603 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:38,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:39,095 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.566373348236084 s; generated tokens: 20 tokens; generate speed: 12.768347994762738 tokens/s +2024-07-30 14:25:39,100 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:39,100 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1642/2067], cost time 1.5783s, every example cost time is 1.5783, generate speed: 12.6718 tokens/s, avg speed: 10.2636 tokens/s, remaining time: 0:09:40 +pred is: + ['cricket, rallying, football, rugby union and boxing'] + label is: + ['cricket, rallying, football, rugby union and boxing'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:39,184 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:39,184 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 283, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:39,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:39,185 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:39,185 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:40,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,367 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1813621520996094 s; generated tokens: 8 tokens; generate speed: 6.771843829414861 tokens/s +2024-07-30 14:25:40,372 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:40,372 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1643/2067], cost time 1.1932s, every example cost time is 1.1932, generate speed: 6.7047 tokens/s, avg speed: 10.2617 tokens/s, remaining time: 0:09:39 +pred is: + ['6'] + label is: + ['six gold'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:40,455 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:40,455 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 314, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:40,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:40,456 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:40,456 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:41,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,632 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.175776481628418 s; generated tokens: 8 tokens; generate speed: 6.804014304589781 tokens/s +2024-07-30 14:25:41,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:41,637 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1644/2067], cost time 1.1876s, every example cost time is 1.1876, generate speed: 6.7362 tokens/s, avg speed: 10.2598 tokens/s, remaining time: 0:09:37 +pred is: + ['volleyball'] + label is: + ["women's volleyball within Africa"] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:25:41,720 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:41,720 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:41,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:41,721 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:41,721 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:42,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:42,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:43,295 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5731585025787354 s; generated tokens: 20 tokens; generate speed: 12.713277121927526 tokens/s +2024-07-30 14:25:43,300 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:43,300 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1645/2067], cost time 1.5849s, every example cost time is 1.5849, generate speed: 12.6195 tokens/s, avg speed: 10.2615 tokens/s, remaining time: 0:09:36 +pred is: + ['Safari Rally'] + label is: + ['the world famous Safari Rally'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:25:43,384 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:43,384 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:43,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:43,385 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:43,385 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:44,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:44,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:44,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:44,398 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.012622594833374 s; generated tokens: 3 tokens; generate speed: 2.962604246939253 tokens/s +2024-07-30 14:25:44,403 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:44,403 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1646/2067], cost time 1.0246s, every example cost time is 1.0246, generate speed: 2.9280 tokens/s, avg speed: 10.2581 tokens/s, remaining time: 0:09:34 +pred is: + ['3'] + label is: + ['three meals in a day'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:44,486 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:44,486 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 259, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:44,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:44,487 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:44,487 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:45,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:45,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:46,055 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5676708221435547 s; generated tokens: 20 tokens; generate speed: 12.757780343613847 tokens/s +2024-07-30 14:25:46,060 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:46,061 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1647/2067], cost time 1.5796s, every example cost time is 1.5796, generate speed: 12.6611 tokens/s, avg speed: 10.2598 tokens/s, remaining time: 0:09:33 +pred is: + ['The United Nations'] + label is: + ['the United Nations'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:46,145 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:46,146 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:46,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:46,146 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:46,147 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:47,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,718 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.571016550064087 s; generated tokens: 20 tokens; generate speed: 12.730610634995625 tokens/s +2024-07-30 14:25:47,723 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:47,723 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1648/2067], cost time 1.5831s, every example cost time is 1.5831, generate speed: 12.6336 tokens/s, avg speed: 10.2615 tokens/s, remaining time: 0:09:32 +pred is: + ['Hoesung Lee'] + label is: + ['Hoesung Lee'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:47,807 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:47,807 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:47,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:47,808 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:47,808 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:48,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:48,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:49,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:49,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:49,359 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5509169101715088 s; generated tokens: 20 tokens; generate speed: 12.89559735201307 tokens/s +2024-07-30 14:25:49,364 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:49,365 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1649/2067], cost time 1.5629s, every example cost time is 1.5629, generate speed: 12.7968 tokens/s, avg speed: 10.2632 tokens/s, remaining time: 0:09:30 +pred is: + ['1'] + label is: + ['representatives appointed by governments and organizations'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:49,449 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:49,449 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:49,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:49,450 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:49,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:50,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:50,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:51,010 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5596754550933838 s; generated tokens: 20 tokens; generate speed: 12.823180575604123 tokens/s +2024-07-30 14:25:51,015 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:51,015 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1650/2067], cost time 1.5716s, every example cost time is 1.5716, generate speed: 12.7257 tokens/s, avg speed: 10.2650 tokens/s, remaining time: 0:09:29 +pred is: + ['1989'] + label is: + ['1989'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.96946884250694, Em score: 49.81818181818182, current_count: 1650 +2024-07-30 14:25:51,596 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:51,597 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:51,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:51,598 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:51,598 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:52,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:52,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:53,155 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5565807819366455 s; generated tokens: 20 tokens; generate speed: 12.848674628448562 tokens/s +2024-07-30 14:25:53,160 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:53,160 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1651/2067], cost time 1.5722s, every example cost time is 1.5722, generate speed: 12.7213 tokens/s, avg speed: 10.2667 tokens/s, remaining time: 0:09:28 +pred is: + ['Carry out research'] + label is: + ['does not carry out research nor does it monitor climate related data'] +The F1/Em of this example is: {'F1': 35.71428571428571, 'Em': 0.0} +2024-07-30 14:25:53,243 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:53,243 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:53,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:53,244 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:53,244 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:54,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,801 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5561742782592773 s; generated tokens: 20 tokens; generate speed: 12.852030957851213 tokens/s +2024-07-30 14:25:54,805 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:54,806 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1652/2067], cost time 1.5677s, every example cost time is 1.5677, generate speed: 12.7579 tokens/s, avg speed: 10.2684 tokens/s, remaining time: 0:09:27 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:54,888 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:54,888 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:54,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:54,889 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:54,889 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:55,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:55,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:55,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:55,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:55,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:55,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,227 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3376789093017578 s; generated tokens: 13 tokens; generate speed: 9.718326206388157 tokens/s +2024-07-30 14:25:56,232 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:56,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1653/2067], cost time 1.3494s, every example cost time is 1.3494, generate speed: 9.6338 tokens/s, avg speed: 10.2680 tokens/s, remaining time: 0:09:25 +pred is: + ['substantially increasing the atmospheric concentrations of the greenhouse gases'] + label is: + ['substantially increasing the atmospheric concentrations'] +The F1/Em of this example is: {'F1': 69.23076923076924, 'Em': 0.0} +2024-07-30 14:25:56,318 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:56,318 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 305, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:56,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:56,319 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:56,319 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:57,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,531 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.211796522140503 s; generated tokens: 9 tokens; generate speed: 7.426989461978739 tokens/s +2024-07-30 14:25:57,536 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:57,537 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1654/2067], cost time 1.2239s, every example cost time is 1.2239, generate speed: 7.3538 tokens/s, avg speed: 10.2665 tokens/s, remaining time: 0:09:24 +pred is: + ['2001'] + label is: + ['2001'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:25:57,620 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:57,620 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:57,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:57,621 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:57,621 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:25:58,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:58,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:59,116 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4951071739196777 s; generated tokens: 18 tokens; generate speed: 12.039270705129411 tokens/s +2024-07-30 14:25:59,121 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:25:59,121 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1655/2067], cost time 1.5068s, every example cost time is 1.5068, generate speed: 11.9460 tokens/s, avg speed: 10.2676 tokens/s, remaining time: 0:09:22 +pred is: + ['1'] + label is: + ['Richard Lindzen'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:25:59,205 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:25:59,205 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:25:59,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:25:59,206 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:25:59,206 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:00,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,771 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5645058155059814 s; generated tokens: 20 tokens; generate speed: 12.783589425988641 tokens/s +2024-07-30 14:26:00,775 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:00,776 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1656/2067], cost time 1.5763s, every example cost time is 1.5763, generate speed: 12.6878 tokens/s, avg speed: 10.2693 tokens/s, remaining time: 0:09:21 +pred is: + ['1'] + label is: + ['the same procedures as for IPCC Assessment Reports'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:00,861 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:00,862 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:00,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:00,862 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:00,863 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:01,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:01,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:01,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:01,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:01,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:01,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,421 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5580921173095703 s; generated tokens: 20 tokens; generate speed: 12.836211529350988 tokens/s +2024-07-30 14:26:02,426 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:02,426 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1657/2067], cost time 1.5702s, every example cost time is 1.5702, generate speed: 12.7370 tokens/s, avg speed: 10.2710 tokens/s, remaining time: 0:09:20 +pred is: + ['1'] + label is: + ['the Data Distribution Centre and the National Greenhouse Gas Inventories Programme'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:02,510 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:02,510 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:02,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:02,511 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:02,511 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:03,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:03,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:04,071 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5593249797821045 s; generated tokens: 20 tokens; generate speed: 12.826062725420291 tokens/s +2024-07-30 14:26:04,076 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:04,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1658/2067], cost time 1.5719s, every example cost time is 1.5719, generate speed: 12.7236 tokens/s, avg speed: 10.2727 tokens/s, remaining time: 0:09:18 +pred is: + ['The date of 2035 has been correctly quoted by the IPCC from the WWF report,'] + label is: + ['the date'] +The F1/Em of this example is: {'F1': 18.181818181818183, 'Em': 0.0} +2024-07-30 14:26:04,161 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:04,161 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:04,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:04,162 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:04,162 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:05,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.559227466583252 s; generated tokens: 20 tokens; generate speed: 12.826864860087518 tokens/s +2024-07-30 14:26:05,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:05,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1659/2067], cost time 1.5712s, every example cost time is 1.5712, generate speed: 12.7292 tokens/s, avg speed: 10.2744 tokens/s, remaining time: 0:09:17 +pred is: + ['Chairman'] + label is: + ['IPCC chairman'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:26:05,811 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:05,811 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 336, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:05,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:05,812 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:05,812 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:06,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:06,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:07,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:07,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:07,068 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2557435035705566 s; generated tokens: 10 tokens; generate speed: 7.963409702352586 tokens/s +2024-07-30 14:26:07,073 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:07,073 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1660/2067], cost time 1.2674s, every example cost time is 1.2674, generate speed: 7.8902 tokens/s, avg speed: 10.2730 tokens/s, remaining time: 0:09:16 +pred is: + ['1999'] + label is: + ['1999'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.808885821242974, Em score: 49.63855421686747, current_count: 1660 +2024-07-30 14:26:07,655 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:07,656 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 382, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:07,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:07,656 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:07,657 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:08,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:08,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:09,037 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.379737377166748 s; generated tokens: 14 tokens; generate speed: 10.146858548362738 tokens/s +2024-07-30 14:26:09,041 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:09,042 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1661/2067], cost time 1.3918s, every example cost time is 1.3918, generate speed: 10.0591 tokens/s, avg speed: 10.2729 tokens/s, remaining time: 0:09:14 +pred is: + ['1000-1900'] + label is: + ['between 1000 and 1900'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:09,124 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:09,125 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:09,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:09,125 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:09,126 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:10,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,388 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,711 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5855779647827148 s; generated tokens: 20 tokens; generate speed: 12.61369698887104 tokens/s +2024-07-30 14:26:10,716 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:10,717 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1662/2067], cost time 1.5972s, every example cost time is 1.5972, generate speed: 12.5222 tokens/s, avg speed: 10.2745 tokens/s, remaining time: 0:09:13 +pred is: + ['1'] + label is: + ['Rep. Joe Barton'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:10,801 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:10,801 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:10,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:10,802 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:10,802 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:11,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:11,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:12,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:12,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:12,043 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2411179542541504 s; generated tokens: 10 tokens; generate speed: 8.057251903997713 tokens/s +2024-07-30 14:26:12,048 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:12,048 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1663/2067], cost time 1.2529s, every example cost time is 1.2529, generate speed: 7.9816 tokens/s, avg speed: 10.2732 tokens/s, remaining time: 0:09:12 +pred is: + ['2001'] + label is: + ['2001'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:12,133 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:12,133 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:12,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:12,134 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:12,134 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:13,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5445616245269775 s; generated tokens: 20 tokens; generate speed: 12.948657847254884 tokens/s +2024-07-30 14:26:13,684 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:13,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1664/2067], cost time 1.5570s, every example cost time is 1.5570, generate speed: 12.8455 tokens/s, avg speed: 10.2750 tokens/s, remaining time: 0:09:10 +pred is: + ['1'] + label is: + ['1 February 2007'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:26:13,767 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:13,767 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:13,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:13,768 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:13,768 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:14,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:14,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:15,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:15,330 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5621824264526367 s; generated tokens: 20 tokens; generate speed: 12.802602091367447 tokens/s +2024-07-30 14:26:15,335 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:15,336 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1665/2067], cost time 1.5739s, every example cost time is 1.5739, generate speed: 12.7073 tokens/s, avg speed: 10.2767 tokens/s, remaining time: 0:09:09 +pred is: + ['Sea level rise'] + label is: + ['projected rises in sea levels'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:26:15,420 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:15,420 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:15,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:15,421 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:15,421 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:16,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:16,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:17,014 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5933234691619873 s; generated tokens: 20 tokens; generate speed: 12.552378965784676 tokens/s +2024-07-30 14:26:17,019 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:17,020 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1666/2067], cost time 1.6050s, every example cost time is 1.6050, generate speed: 12.4614 tokens/s, avg speed: 10.2782 tokens/s, remaining time: 0:09:08 +pred is: + ['1'] + label is: + ['coordinating lead author of the Fifth Assessment Report'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:17,128 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:17,128 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:17,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:17,129 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:17,129 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:18,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,696 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5663890838623047 s; generated tokens: 20 tokens; generate speed: 12.76821972653515 tokens/s +2024-07-30 14:26:18,701 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:18,701 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1667/2067], cost time 1.5783s, every example cost time is 1.5783, generate speed: 12.6722 tokens/s, avg speed: 10.2799 tokens/s, remaining time: 0:09:06 +pred is: + ['1'] + label is: + ['the Montreal Protocol'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:18,784 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:18,785 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:18,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:18,785 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:18,785 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:19,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:19,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:20,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:20,359 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5730257034301758 s; generated tokens: 20 tokens; generate speed: 12.714350411685928 tokens/s +2024-07-30 14:26:20,364 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:20,364 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1668/2067], cost time 1.5849s, every example cost time is 1.5849, generate speed: 12.6190 tokens/s, avg speed: 10.2815 tokens/s, remaining time: 0:09:05 +pred is: + ['1'] + label is: + ['Sheldon Ungar'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:20,447 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:20,447 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:20,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:20,448 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:20,448 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:21,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:21,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:22,035 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5864717960357666 s; generated tokens: 20 tokens; generate speed: 12.6065903282841 tokens/s +2024-07-30 14:26:22,040 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:22,040 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1669/2067], cost time 1.5984s, every example cost time is 1.5984, generate speed: 12.5126 tokens/s, avg speed: 10.2831 tokens/s, remaining time: 0:09:04 +pred is: + ['1'] + label is: + ['other scientific bodies'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:22,123 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:22,123 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:22,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:22,124 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:22,124 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:23,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,366 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2417385578155518 s; generated tokens: 10 tokens; generate speed: 8.053225002203245 tokens/s +2024-07-30 14:26:23,371 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:23,371 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1670/2067], cost time 1.2535s, every example cost time is 1.2535, generate speed: 7.9775 tokens/s, avg speed: 10.2818 tokens/s, remaining time: 0:09:02 +pred is: + ['5'] + label is: + ['five'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.52374564381322, Em score: 49.40119760479042, current_count: 1670 +2024-07-30 14:26:23,955 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:23,956 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:23,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:23,956 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:23,957 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:24,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:24,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:24,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,519 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5623228549957275 s; generated tokens: 20 tokens; generate speed: 12.801451336417077 tokens/s +2024-07-30 14:26:25,524 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:25,524 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1671/2067], cost time 1.5744s, every example cost time is 1.5744, generate speed: 12.7036 tokens/s, avg speed: 10.2835 tokens/s, remaining time: 0:09:01 +pred is: + ['To conduct photosynthesis'] + label is: + ['to conduct photosynthesis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:25,608 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:25,608 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:25,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:25,609 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:25,609 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:26,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2075741291046143 s; generated tokens: 9 tokens; generate speed: 7.452958607744663 tokens/s +2024-07-30 14:26:26,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:26,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1672/2067], cost time 1.2192s, every example cost time is 1.2192, generate speed: 7.3822 tokens/s, avg speed: 10.2819 tokens/s, remaining time: 0:09:00 +pred is: + ['They pinch in two to reproduce.'] + label is: + ['pinch in two'] +The F1/Em of this example is: {'F1': 58.82352941176471, 'Em': 0.0} +2024-07-30 14:26:26,905 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:26,906 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:26,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:26,906 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:26,906 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:27,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:27,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:27,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:27,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:27,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:28,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:28,017 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1107544898986816 s; generated tokens: 6 tokens; generate speed: 5.401733735550594 tokens/s +2024-07-30 14:26:28,022 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:28,022 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1673/2067], cost time 1.1223s, every example cost time is 1.1223, generate speed: 5.3464 tokens/s, avg speed: 10.2795 tokens/s, remaining time: 0:08:58 +pred is: + ['Plants and algae'] + label is: + ['plants and algae'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:28,105 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:28,106 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:28,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:28,107 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:28,107 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:29,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,380 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2731938362121582 s; generated tokens: 11 tokens; generate speed: 8.639689956971344 tokens/s +2024-07-30 14:26:29,385 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:29,385 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1674/2067], cost time 1.2851s, every example cost time is 1.2851, generate speed: 8.5595 tokens/s, avg speed: 10.2785 tokens/s, remaining time: 0:08:57 +pred is: + ['Cyanobacteria'] + label is: + ['Cyanobacteria'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:29,468 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:29,468 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:29,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:29,469 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:29,469 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:30,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:30,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:31,058 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.588484764099121 s; generated tokens: 20 tokens; generate speed: 12.590614938219202 tokens/s +2024-07-30 14:26:31,063 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:31,063 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1675/2067], cost time 1.6005s, every example cost time is 1.6005, generate speed: 12.4961 tokens/s, avg speed: 10.2801 tokens/s, remaining time: 0:08:56 +pred is: + ['1'] + label is: + ['eukaryotic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:31,147 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:31,147 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:31,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:31,148 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:31,148 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:32,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,705 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5562117099761963 s; generated tokens: 20 tokens; generate speed: 12.85172182665681 tokens/s +2024-07-30 14:26:32,709 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:32,710 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1676/2067], cost time 1.5682s, every example cost time is 1.5682, generate speed: 12.7531 tokens/s, avg speed: 10.2818 tokens/s, remaining time: 0:08:54 +pred is: + ['A type of organelle'] + label is: + ['almost the same thing as chloroplast'] +The F1/Em of this example is: {'F1': 11.11111111111111, 'Em': 0.0} +2024-07-30 14:26:32,824 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:32,825 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 298, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:32,825 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:32,826 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:32,826 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:33,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:33,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:34,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:34,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:34,374 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5484604835510254 s; generated tokens: 20 tokens; generate speed: 12.916054502168995 tokens/s +2024-07-30 14:26:34,379 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:34,380 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1677/2067], cost time 1.5605s, every example cost time is 1.5605, generate speed: 12.8165 tokens/s, avg speed: 10.2835 tokens/s, remaining time: 0:08:53 +pred is: + ['1'] + label is: + ['glaucophyte'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:34,462 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:34,462 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 262, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:34,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:34,463 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:34,463 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:35,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,600 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1367194652557373 s; generated tokens: 7 tokens; generate speed: 6.158071726540859 tokens/s +2024-07-30 14:26:35,605 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:35,605 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1678/2067], cost time 1.1480s, every example cost time is 1.1480, generate speed: 6.0973 tokens/s, avg speed: 10.2814 tokens/s, remaining time: 0:08:52 +pred is: + ['phycoerytherin'] + label is: + ['chlorophyll a and phycobilins'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:35,688 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:35,688 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:35,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:35,689 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:35,689 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:36,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:36,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:37,235 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5462355613708496 s; generated tokens: 20 tokens; generate speed: 12.934639779121722 tokens/s +2024-07-30 14:26:37,240 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:37,240 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1679/2067], cost time 1.5577s, every example cost time is 1.5577, generate speed: 12.8392 tokens/s, avg speed: 10.2831 tokens/s, remaining time: 0:08:50 +pred is: + ['1'] + label is: + ['phycobilisomes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:37,324 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:37,324 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:37,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:37,325 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:37,325 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:38,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:38,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:38,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:38,339 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.013906478881836 s; generated tokens: 3 tokens; generate speed: 2.9588527763512102 tokens/s +2024-07-30 14:26:38,344 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:38,344 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1680/2067], cost time 1.0254s, every example cost time is 1.0254, generate speed: 2.9256 tokens/s, avg speed: 10.2798 tokens/s, remaining time: 0:08:49 +pred is: + ['double'] + label is: + ['double'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 63.42535111053032, Em score: 49.345238095238095, current_count: 1680 +2024-07-30 14:26:38,923 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:38,924 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:38,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:38,924 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:38,924 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:39,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:39,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:39,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:39,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:39,998 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,134 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.209099292755127 s; generated tokens: 9 tokens; generate speed: 7.443557409989095 tokens/s +2024-07-30 14:26:40,139 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:40,139 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1681/2067], cost time 1.2210s, every example cost time is 1.2210, generate speed: 7.3713 tokens/s, avg speed: 10.2783 tokens/s, remaining time: 0:08:47 +pred is: + ['Chloroplasts with three membranes'] + label is: + ['chloroplasts derived from a green alga'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 14:26:40,223 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:40,223 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:40,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:40,224 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:40,224 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:41,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:41,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:41,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:41,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:41,275 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0508098602294922 s; generated tokens: 4 tokens; generate speed: 3.8065878056439417 tokens/s +2024-07-30 14:26:41,280 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:41,280 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1682/2067], cost time 1.0625s, every example cost time is 1.0625, generate speed: 3.7646 tokens/s, avg speed: 10.2753 tokens/s, remaining time: 0:08:46 +pred is: + ['Algae'] + label is: + ['cryptomonads'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:41,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:41,365 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:41,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:41,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:41,366 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:42,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:42,933 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5672035217285156 s; generated tokens: 20 tokens; generate speed: 12.761584390737843 tokens/s +2024-07-30 14:26:42,938 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:42,938 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1683/2067], cost time 1.5794s, every example cost time is 1.5794, generate speed: 12.6632 tokens/s, avg speed: 10.2769 tokens/s, remaining time: 0:08:45 +pred is: + ['Helicosproidia'] + label is: + ['helicosproidia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:43,022 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:43,022 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:43,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:43,023 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:43,023 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:43,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,098 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0750916004180908 s; generated tokens: 5 tokens; generate speed: 4.650766500320119 tokens/s +2024-07-30 14:26:44,103 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:44,103 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1684/2067], cost time 1.0867s, every example cost time is 1.0867, generate speed: 4.6010 tokens/s, avg speed: 10.2743 tokens/s, remaining time: 0:08:43 +pred is: + ['Fatty acids'] + label is: + ['fatty acids, isopentenyl pyrophosphate, iron-sulfur clusters'] +The F1/Em of this example is: {'F1': 37.5, 'Em': 0.0} +2024-07-30 14:26:44,186 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:44,187 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:44,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:44,187 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:44,187 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:45,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,269 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0810527801513672 s; generated tokens: 5 tokens; generate speed: 4.6251210780845575 tokens/s +2024-07-30 14:26:45,273 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:45,274 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1685/2067], cost time 1.0926s, every example cost time is 1.0926, generate speed: 4.5762 tokens/s, avg speed: 10.2715 tokens/s, remaining time: 0:08:42 +pred is: + ['Peridinin'] + label is: + ['Peridinin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:26:45,356 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:45,356 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:45,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:45,357 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:45,357 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:46,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,902 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5441479682922363 s; generated tokens: 20 tokens; generate speed: 12.952126616543861 tokens/s +2024-07-30 14:26:46,906 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:46,907 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1686/2067], cost time 1.5559s, every example cost time is 1.5559, generate speed: 12.8542 tokens/s, avg speed: 10.2733 tokens/s, remaining time: 0:08:40 +pred is: + ['Dinoflagellate'] + label is: + ['fucoxanthin dinophyte'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:46,990 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:46,990 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:46,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:46,991 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:46,991 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:47,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:47,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,540 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5491583347320557 s; generated tokens: 20 tokens; generate speed: 12.910236191873327 tokens/s +2024-07-30 14:26:48,545 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:48,546 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1687/2067], cost time 1.5607s, every example cost time is 1.5607, generate speed: 12.8144 tokens/s, avg speed: 10.2750 tokens/s, remaining time: 0:08:39 +pred is: + ['1'] + label is: + ['a cryptophyte'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:48,628 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:48,628 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 284, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:48,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:48,629 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:48,629 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:49,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:49,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:49,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:49,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:49,673 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0435223579406738 s; generated tokens: 4 tokens; generate speed: 3.8331713446885316 tokens/s +2024-07-30 14:26:49,678 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:49,678 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1688/2067], cost time 1.0552s, every example cost time is 1.0552, generate speed: 3.7908 tokens/s, avg speed: 10.2720 tokens/s, remaining time: 0:08:38 +pred is: + ['Alga'] + label is: + ['heterokontophyte'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:26:49,770 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:49,771 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 196, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:49,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:49,772 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:49,772 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:50,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:50,911 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1391050815582275 s; generated tokens: 7 tokens; generate speed: 6.145174938930497 tokens/s +2024-07-30 14:26:50,916 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:50,916 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1689/2067], cost time 1.1513s, every example cost time is 1.1513, generate speed: 6.0801 tokens/s, avg speed: 10.2700 tokens/s, remaining time: 0:08:36 +pred is: + ['Dinophyte nucleus'] + label is: + ['the dinophyte nucleus'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:26:51,000 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:51,000 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 299, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:51,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:51,001 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:51,001 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:51,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:51,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:52,547 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5456106662750244 s; generated tokens: 20 tokens; generate speed: 12.939869293345845 tokens/s +2024-07-30 14:26:52,552 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:52,552 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1690/2067], cost time 1.5572s, every example cost time is 1.5572, generate speed: 12.8432 tokens/s, avg speed: 10.2717 tokens/s, remaining time: 0:08:35 +pred is: + ['1'] + label is: + ['first set of endosymbiotic events'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.248113661487075, Em score: 49.171597633136095, current_count: 1690 +2024-07-30 14:26:53,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:53,147 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:53,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:53,148 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:53,148 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:54,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:54,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:54,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:54,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:54,192 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0440831184387207 s; generated tokens: 4 tokens; generate speed: 3.8311126091009275 tokens/s +2024-07-30 14:26:54,197 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:54,197 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1691/2067], cost time 1.0561s, every example cost time is 1.0561, generate speed: 3.7877 tokens/s, avg speed: 10.2687 tokens/s, remaining time: 0:08:33 +pred is: + ['ctDNA'] + label is: + ['ctDNA, or cpDNA'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:26:54,280 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:54,281 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:54,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:54,281 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:54,282 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:55,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,357 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0756182670593262 s; generated tokens: 5 tokens; generate speed: 4.648489295063472 tokens/s +2024-07-30 14:26:55,362 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:55,363 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1692/2067], cost time 1.0871s, every example cost time is 1.0871, generate speed: 4.5993 tokens/s, avg speed: 10.2661 tokens/s, remaining time: 0:08:32 +pred is: + ['Inverted repeats'] + label is: + ['The inverted repeat regions'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:26:55,445 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:55,446 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:55,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:55,447 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:55,447 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:56,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:56,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:57,005 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5584123134613037 s; generated tokens: 20 tokens; generate speed: 12.833574162141405 tokens/s +2024-07-30 14:26:57,010 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:57,011 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1693/2067], cost time 1.5702s, every example cost time is 1.5702, generate speed: 12.7369 tokens/s, avg speed: 10.2677 tokens/s, remaining time: 0:08:31 +pred is: + ['By electron microscopy'] + label is: + ['electron microscopy'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:26:57,094 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:57,094 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:57,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:57,095 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:57,095 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:58,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,294 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2967352867126465 s; generated tokens: 12 tokens; generate speed: 9.254008989314388 tokens/s +2024-07-30 14:26:58,397 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:58,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1694/2067], cost time 1.3084s, every example cost time is 1.3084, generate speed: 9.1717 tokens/s, avg speed: 10.2671 tokens/s, remaining time: 0:08:29 +pred is: + ['A → G deamination gradients'] + label is: + ['A → G deamination'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:26:58,488 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:26:58,489 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:26:58,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:58,489 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:26:58,490 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:26:59,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:26:59,927 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4368345737457275 s; generated tokens: 16 tokens; generate speed: 11.135589505122441 tokens/s +2024-07-30 14:26:59,932 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:26:59,932 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1695/2067], cost time 1.4486s, every example cost time is 1.4486, generate speed: 11.0454 tokens/s, avg speed: 10.2676 tokens/s, remaining time: 0:08:28 +pred is: + ['bacteriophage T4'] + label is: + ['bacteriophage T4'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:00,015 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:00,016 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:00,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:00,016 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:00,017 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:00,960 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:00,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:01,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:01,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:01,071 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0541865825653076 s; generated tokens: 4 tokens; generate speed: 3.7943947173622816 tokens/s +2024-07-30 14:27:01,076 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:01,076 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1696/2067], cost time 1.0658s, every example cost time is 1.0658, generate speed: 3.7531 tokens/s, avg speed: 10.2646 tokens/s, remaining time: 0:08:27 +pred is: + ['Genes'] + label is: + ['Endosymbiotic gene transfer'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:01,158 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:01,158 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:01,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:01,159 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:01,159 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:02,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,360 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.201005220413208 s; generated tokens: 9 tokens; generate speed: 7.493722630867111 tokens/s +2024-07-30 14:27:02,365 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:02,366 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1697/2067], cost time 1.2122s, every example cost time is 1.2122, generate speed: 7.4242 tokens/s, avg speed: 10.2631 tokens/s, remaining time: 0:08:25 +pred is: + ['Most became nonfunctional pseudogenes'] + label is: + ['nonfunctional pseudogenes'] +The F1/Em of this example is: {'F1': 60.0, 'Em': 0.0} +2024-07-30 14:27:02,448 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:02,449 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 184, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:02,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:02,449 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:02,450 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:03,393 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:03,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:03,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:03,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:03,499 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0494327545166016 s; generated tokens: 4 tokens; generate speed: 3.81158295544388 tokens/s +2024-07-30 14:27:03,504 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:03,504 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1698/2067], cost time 1.0610s, every example cost time is 1.0610, generate speed: 3.7699 tokens/s, avg speed: 10.2602 tokens/s, remaining time: 0:08:24 +pred is: + ['Ribosome'] + label is: + ['a ribosome'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:27:03,597 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:03,597 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:03,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:03,598 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:03,598 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:04,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:04,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:05,147 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5487585067749023 s; generated tokens: 20 tokens; generate speed: 12.913569102291824 tokens/s +2024-07-30 14:27:05,152 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:05,153 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1699/2067], cost time 1.5608s, every example cost time is 1.5608, generate speed: 12.8143 tokens/s, avg speed: 10.2619 tokens/s, remaining time: 0:08:22 +pred is: + ['lens-shaped'] + label is: + ['lens-shaped'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:05,235 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:05,235 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:05,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:05,236 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:05,236 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:06,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,432 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:06,601 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3646256923675537 s; generated tokens: 14 tokens; generate speed: 10.259223520634979 tokens/s +2024-07-30 14:27:06,606 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:06,606 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1700/2067], cost time 1.3760s, every example cost time is 1.3760, generate speed: 10.1742 tokens/s, avg speed: 10.2618 tokens/s, remaining time: 0:08:21 +pred is: + ['The fact that chloroplasts are surrounded by a double membrane'] + label is: + ['a double membrane'] +The F1/Em of this example is: {'F1': 41.66666666666667, 'Em': 0.0} +F1 score: 63.21885304891251, Em score: 49.0, current_count: 1700 +2024-07-30 14:27:07,194 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:07,194 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:07,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:07,195 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:07,195 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:08,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,617 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4223299026489258 s; generated tokens: 16 tokens; generate speed: 11.249148295484641 tokens/s +2024-07-30 14:27:08,622 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:08,623 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1701/2067], cost time 1.4343s, every example cost time is 1.4343, generate speed: 11.1550 tokens/s, avg speed: 10.2624 tokens/s, remaining time: 0:08:20 +pred is: + ['The chloroplast double membrane is sometimes compared to the mitochondrial double membrane.'] + label is: + ['the mitochondrial double membrane'] +The F1/Em of this example is: {'F1': 45.16129032258064, 'Em': 0.0} +2024-07-30 14:27:08,705 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:08,706 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:08,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:08,706 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:08,706 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:09,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,785 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.077876091003418 s; generated tokens: 5 tokens; generate speed: 4.638752117922379 tokens/s +2024-07-30 14:27:09,789 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:09,790 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1702/2067], cost time 1.0892s, every example cost time is 1.0892, generate speed: 4.5906 tokens/s, avg speed: 10.2597 tokens/s, remaining time: 0:08:18 +pred is: + ['Stromules'] + label is: + ['Stromules'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:09,874 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:09,874 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:09,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:09,875 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:09,875 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:10,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:10,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:10,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:10,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:10,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:10,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,420 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5443394184112549 s; generated tokens: 20 tokens; generate speed: 12.95052095515057 tokens/s +2024-07-30 14:27:11,424 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:11,425 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1703/2067], cost time 1.5562s, every example cost time is 1.5562, generate speed: 12.8517 tokens/s, avg speed: 10.2614 tokens/s, remaining time: 0:08:17 +pred is: + ['In the chloroplasts of C4 plants'] + label is: + ['in the chloroplasts of C4 plants'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:11,508 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:11,508 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:11,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:11,509 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:11,509 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:12,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,772 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2630548477172852 s; generated tokens: 11 tokens; generate speed: 8.70904380746431 tokens/s +2024-07-30 14:27:12,777 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:12,778 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1704/2067], cost time 1.2746s, every example cost time is 1.2746, generate speed: 8.6305 tokens/s, avg speed: 10.2606 tokens/s, remaining time: 0:08:16 +pred is: + ['To synthesize a small fraction of their proteins'] + label is: + ['synthesize a small fraction of their proteins'] +The F1/Em of this example is: {'F1': 92.85714285714286, 'Em': 0.0} +2024-07-30 14:27:12,861 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:12,861 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:12,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:12,862 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:12,862 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:13,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:13,971 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1085197925567627 s; generated tokens: 6 tokens; generate speed: 5.4126232479450875 tokens/s +2024-07-30 14:27:13,976 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:13,976 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1705/2067], cost time 1.1202s, every example cost time is 1.1202, generate speed: 5.3564 tokens/s, avg speed: 10.2582 tokens/s, remaining time: 0:08:14 +pred is: + ['Plastoglobulus'] + label is: + ['plastoglobulus, sometimes spelled plastoglobule(s)'] +The F1/Em of this example is: {'F1': 16.666666666666668, 'Em': 0.0} +2024-07-30 14:27:14,059 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:14,059 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:14,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:14,060 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:14,060 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:15,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,171 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1111085414886475 s; generated tokens: 6 tokens; generate speed: 5.400012488394054 tokens/s +2024-07-30 14:27:15,176 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:15,176 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1706/2067], cost time 1.1227s, every example cost time is 1.1227, generate speed: 5.3444 tokens/s, avg speed: 10.2558 tokens/s, remaining time: 0:08:13 +pred is: + ['Thylakoid'] + label is: + ['either to a thylakoid or to another plastoglobulus attached to a thylakoid'] +The F1/Em of this example is: {'F1': 8.333333333333332, 'Em': 0.0} +2024-07-30 14:27:15,260 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:15,261 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:15,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:15,261 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:15,262 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:16,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:16,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:16,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:16,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:16,307 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0448071956634521 s; generated tokens: 4 tokens; generate speed: 3.828457553319205 tokens/s +2024-07-30 14:27:16,311 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:16,312 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1707/2067], cost time 1.0564s, every example cost time is 1.0564, generate speed: 3.7864 tokens/s, avg speed: 10.2529 tokens/s, remaining time: 0:08:11 +pred is: + ['In algae'] + label is: + ['The chloroplasts of some hornworts and algae'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:27:16,395 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:16,395 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:16,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:16,396 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:16,396 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:17,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:17,942 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5459885597229004 s; generated tokens: 20 tokens; generate speed: 12.936706338619192 tokens/s +2024-07-30 14:27:17,947 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:17,948 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1708/2067], cost time 1.5581s, every example cost time is 1.5581, generate speed: 12.8365 tokens/s, avg speed: 10.2546 tokens/s, remaining time: 0:08:10 +pred is: + ['helical thylakoid model'] + label is: + ['the helical thylakoid model'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:27:18,030 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:18,030 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:18,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:18,031 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:18,031 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:18,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,578 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5465118885040283 s; generated tokens: 20 tokens; generate speed: 12.932328647887989 tokens/s +2024-07-30 14:27:19,583 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:19,583 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1709/2067], cost time 1.5583s, every example cost time is 1.5583, generate speed: 12.8348 tokens/s, avg speed: 10.2563 tokens/s, remaining time: 0:08:09 +pred is: + ['Red and blue light'] + label is: + ['light energy'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:27:19,666 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:19,666 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:19,667 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:19,667 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:19,667 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:20,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:20,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:20,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:20,679 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0115420818328857 s; generated tokens: 3 tokens; generate speed: 2.965768853198954 tokens/s +2024-07-30 14:27:20,684 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:20,684 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1710/2067], cost time 1.0230s, every example cost time is 1.0230, generate speed: 2.9326 tokens/s, avg speed: 10.2531 tokens/s, remaining time: 0:08:07 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 63.13649236822474, Em score: 48.83040935672515, current_count: 1710 +2024-07-30 14:27:21,280 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:21,280 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:21,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:21,281 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:21,281 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:22,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:22,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:22,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:22,294 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0123541355133057 s; generated tokens: 3 tokens; generate speed: 2.9633898798456286 tokens/s +2024-07-30 14:27:22,298 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:22,299 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1711/2067], cost time 1.0242s, every example cost time is 1.0242, generate speed: 2.9291 tokens/s, avg speed: 10.2499 tokens/s, remaining time: 0:08:06 +pred is: + ['30'] + label is: + ['about thirty'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:22,381 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:22,381 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:22,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:22,382 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:22,382 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:23,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:23,936 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5530896186828613 s; generated tokens: 20 tokens; generate speed: 12.877556941602332 tokens/s +2024-07-30 14:27:23,940 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:23,941 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1712/2067], cost time 1.5646s, every example cost time is 1.5646, generate speed: 12.7826 tokens/s, avg speed: 10.2516 tokens/s, remaining time: 0:08:04 +pred is: + ['Pigments'] + label is: + ['e a third group of pigments found in cyanobacteria'] +The F1/Em of this example is: {'F1': 11.11111111111111, 'Em': 0.0} +2024-07-30 14:27:24,031 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:24,032 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:24,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:24,032 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:24,033 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:24,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,363 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3300306797027588 s; generated tokens: 13 tokens; generate speed: 9.774210624152895 tokens/s +2024-07-30 14:27:25,368 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:25,368 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1713/2067], cost time 1.3428s, every example cost time is 1.3428, generate speed: 9.6811 tokens/s, avg speed: 10.2513 tokens/s, remaining time: 0:08:03 +pred is: + ['1'] + label is: + ['an enzyme called rubisco'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:25,452 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:25,452 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 320, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:25,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:25,453 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:25,453 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:26,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:26,997 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5435051918029785 s; generated tokens: 20 tokens; generate speed: 12.957520393331407 tokens/s +2024-07-30 14:27:27,002 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:27,002 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1714/2067], cost time 1.5555s, every example cost time is 1.5555, generate speed: 12.8578 tokens/s, avg speed: 10.2530 tokens/s, remaining time: 0:08:02 +pred is: + ['1'] + label is: + ['light reactions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:27,085 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:27,086 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:27,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:27,086 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:27,086 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:28,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,188 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,378 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.291320562362671 s; generated tokens: 12 tokens; generate speed: 9.292812605759288 tokens/s +2024-07-30 14:27:28,384 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:28,384 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1715/2067], cost time 1.3037s, every example cost time is 1.3037, generate speed: 9.2044 tokens/s, avg speed: 10.2524 tokens/s, remaining time: 0:08:00 +pred is: + ['The green parts of plants have chloroplasts.'] + label is: + ['All green parts'] +The F1/Em of this example is: {'F1': 42.105263157894726, 'Em': 0.0} +2024-07-30 14:27:28,468 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:28,469 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:28,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:28,469 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:28,469 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:29,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,548 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.078801155090332 s; generated tokens: 5 tokens; generate speed: 4.634774421965957 tokens/s +2024-07-30 14:27:29,553 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:29,554 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1716/2067], cost time 1.0904s, every example cost time is 1.0904, generate speed: 4.5855 tokens/s, avg speed: 10.2498 tokens/s, remaining time: 0:07:59 +pred is: + ['In the stems'] + label is: + ['in the stems'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:29,637 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:29,637 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:29,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:29,638 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:29,638 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:30,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:30,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:31,177 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5393016338348389 s; generated tokens: 20 tokens; generate speed: 12.992905068368117 tokens/s +2024-07-30 14:27:31,182 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:31,182 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1717/2067], cost time 1.5509s, every example cost time is 1.5509, generate speed: 12.8958 tokens/s, avg speed: 10.2516 tokens/s, remaining time: 0:07:58 +pred is: + ['When there is low light'] + label is: + ['low-light conditions'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 14:27:31,265 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:31,266 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:31,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:31,266 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:31,266 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:32,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:32,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:32,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:32,277 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0102605819702148 s; generated tokens: 3 tokens; generate speed: 2.9695308849419684 tokens/s +2024-07-30 14:27:32,282 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:32,282 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1718/2067], cost time 1.0215s, every example cost time is 1.0215, generate speed: 2.9368 tokens/s, avg speed: 10.2484 tokens/s, remaining time: 0:07:56 +pred is: + ['2'] + label is: + ['two'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:32,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:32,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:32,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:32,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:32,365 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:33,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,853 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4877567291259766 s; generated tokens: 18 tokens; generate speed: 12.098752200283842 tokens/s +2024-07-30 14:27:33,858 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:33,858 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1719/2067], cost time 1.4992s, every example cost time is 1.4992, generate speed: 12.0066 tokens/s, avg speed: 10.2495 tokens/s, remaining time: 0:07:55 +pred is: + ['salicylic acid, jasmonic acid, nitric oxide and reactive oxygen species'] + label is: + ['salicylic acid, jasmonic acid, nitric oxide and reactive oxygen species'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:33,941 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:33,942 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:33,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:33,942 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:33,943 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:34,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:34,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:34,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:34,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:35,511 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5678937435150146 s; generated tokens: 20 tokens; generate speed: 12.7559664567336 tokens/s +2024-07-30 14:27:35,515 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:35,516 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1720/2067], cost time 1.5793s, every example cost time is 1.5793, generate speed: 12.6641 tokens/s, avg speed: 10.2511 tokens/s, remaining time: 0:07:53 +pred is: + ['Photosynthesis'] + label is: + ['photosynthesis'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.98446801779069, Em score: 48.72093023255814, current_count: 1720 +2024-07-30 14:27:36,113 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:36,114 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:36,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:36,115 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:36,115 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:37,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,686 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5709309577941895 s; generated tokens: 20 tokens; generate speed: 12.731304263099407 tokens/s +2024-07-30 14:27:37,691 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:37,691 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1721/2067], cost time 1.5828s, every example cost time is 1.5828, generate speed: 12.6359 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:07:52 +pred is: + ['Use the potential energy stored in an H+, or hydrogen ion gradient to generate ATP energy'] + label is: + ['generate ATP energy'] +The F1/Em of this example is: {'F1': 27.027027027027028, 'Em': 0.0} +2024-07-30 14:27:37,774 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:37,774 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:37,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:37,775 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:37,775 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:38,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:38,976 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2004280090332031 s; generated tokens: 9 tokens; generate speed: 7.497325897325897 tokens/s +2024-07-30 14:27:38,981 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:38,981 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1722/2067], cost time 1.2117s, every example cost time is 1.2117, generate speed: 7.4277 tokens/s, avg speed: 10.2513 tokens/s, remaining time: 0:07:51 +pred is: + ['NADP+'] + label is: + ['NADP+'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:39,063 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:39,063 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:39,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:39,064 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:39,064 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:40,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,575 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5104222297668457 s; generated tokens: 19 tokens; generate speed: 12.579264013436104 tokens/s +2024-07-30 14:27:40,579 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:40,580 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1723/2067], cost time 1.5218s, every example cost time is 1.5218, generate speed: 12.4854 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:07:49 +pred is: + ['1'] + label is: + ['The Calvin cycle'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:40,663 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:40,663 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:40,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:40,664 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:40,664 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:41,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,798 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:41,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:42,138 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4741694927215576 s; generated tokens: 17 tokens; generate speed: 11.531916841268519 tokens/s +2024-07-30 14:27:42,143 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:42,143 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1724/2067], cost time 1.4854s, every example cost time is 1.4854, generate speed: 11.4449 tokens/s, avg speed: 10.2535 tokens/s, remaining time: 0:07:48 +pred is: + ['Glucose monomers in the chloroplast can be linked together to make starch'] + label is: + ['glucose monomers in the chloroplast can be linked together'] +The F1/Em of this example is: {'F1': 85.0, 'Em': 0.0} +2024-07-30 14:27:42,227 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:42,227 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:42,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:42,228 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:42,228 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:43,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,786 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5576422214508057 s; generated tokens: 20 tokens; generate speed: 12.839919029269618 tokens/s +2024-07-30 14:27:43,791 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:43,791 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1725/2067], cost time 1.5689s, every example cost time is 1.5689, generate speed: 12.7481 tokens/s, avg speed: 10.2551 tokens/s, remaining time: 0:07:47 +pred is: + ['1'] + label is: + ['add O2 instead of CO2 to RuBP'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:43,874 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:43,874 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:43,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:43,875 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:43,875 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:44,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:44,979 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1041569709777832 s; generated tokens: 6 tokens; generate speed: 5.434009980199388 tokens/s +2024-07-30 14:27:44,984 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:44,984 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1726/2067], cost time 1.1153s, every example cost time is 1.1153, generate speed: 5.3798 tokens/s, avg speed: 10.2528 tokens/s, remaining time: 0:07:45 +pred is: + ['In the stroma'] + label is: + ['in their stroma'] +The F1/Em of this example is: {'F1': 40.00000000000001, 'Em': 0.0} +2024-07-30 14:27:45,066 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:45,067 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:45,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:45,067 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:45,067 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:46,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,173 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1050240993499756 s; generated tokens: 6 tokens; generate speed: 5.429745834076802 tokens/s +2024-07-30 14:27:46,177 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:46,178 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1727/2067], cost time 1.1163s, every example cost time is 1.1163, generate speed: 5.3748 tokens/s, avg speed: 10.2505 tokens/s, remaining time: 0:07:44 +pred is: + ['Chloroplasts'] + label is: + ['Chloroplasts'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:46,261 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:46,261 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:46,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:46,262 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:46,262 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:47,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,458 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1958444118499756 s; generated tokens: 8 tokens; generate speed: 6.689833493994399 tokens/s +2024-07-30 14:27:47,463 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:47,463 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1728/2067], cost time 1.2076s, every example cost time is 1.2076, generate speed: 6.6245 tokens/s, avg speed: 10.2487 tokens/s, remaining time: 0:07:43 +pred is: + ['They form etioplasts'] + label is: + ['proplastids may develop into an etioplast stage before becoming chloroplasts'] +The F1/Em of this example is: {'F1': 8.333333333333332, 'Em': 0.0} +2024-07-30 14:27:47,547 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:47,547 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:47,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:47,548 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:47,548 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:48,492 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,558 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,658 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1097209453582764 s; generated tokens: 6 tokens; generate speed: 5.4067646691690445 tokens/s +2024-07-30 14:27:48,663 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:48,663 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1729/2067], cost time 1.1214s, every example cost time is 1.1214, generate speed: 5.3505 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:07:41 +pred is: + ['Chromoplasts'] + label is: + ['chromoplasts'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:48,746 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:48,747 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:48,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:48,747 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:48,748 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:49,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,725 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,791 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:49,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:50,303 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5556862354278564 s; generated tokens: 20 tokens; generate speed: 12.856062838724963 tokens/s +2024-07-30 14:27:50,308 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:50,309 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1730/2067], cost time 1.5673s, every example cost time is 1.5673, generate speed: 12.7611 tokens/s, avg speed: 10.2480 tokens/s, remaining time: 0:07:40 +pred is: + ['1'] + label is: + ['filaments'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.886500202867246, Em score: 48.61271676300578, current_count: 1730 +2024-07-30 14:27:50,910 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:50,910 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:50,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:50,911 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:50,911 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:51,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:51,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:51,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:51,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:51,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:52,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:52,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:52,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:52,081 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1691913604736328 s; generated tokens: 8 tokens; generate speed: 6.842335883117752 tokens/s +2024-07-30 14:27:52,085 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:52,086 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1731/2067], cost time 1.1809s, every example cost time is 1.1809, generate speed: 6.7747 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:07:38 +pred is: + ['Plastid-dividing rings'] + label is: + ['plastid-dividing rings'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:52,169 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:52,169 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 143, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:52,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:52,170 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:52,170 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:53,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:53,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:53,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:53,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:53,214 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0434746742248535 s; generated tokens: 4 tokens; generate speed: 3.8333465093164865 tokens/s +2024-07-30 14:27:53,219 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:53,219 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1732/2067], cost time 1.0551s, every example cost time is 1.0551, generate speed: 3.7911 tokens/s, avg speed: 10.2434 tokens/s, remaining time: 0:07:37 +pred is: + ['White light'] + label is: + ['Light'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:27:53,301 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:53,302 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:53,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:53,302 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:53,303 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:54,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,866 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5636804103851318 s; generated tokens: 20 tokens; generate speed: 12.790337377875083 tokens/s +2024-07-30 14:27:54,871 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:54,872 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1733/2067], cost time 1.5754s, every example cost time is 1.5754, generate speed: 12.6951 tokens/s, avg speed: 10.2450 tokens/s, remaining time: 0:07:36 +pred is: + ['1'] + label is: + ['transgenes in these plastids cannot be disseminated by pollen'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:54,956 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:54,956 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:54,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:54,957 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:54,957 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:55,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:55,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:55,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,159 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2020611763000488 s; generated tokens: 8 tokens; generate speed: 6.655235322235467 tokens/s +2024-07-30 14:27:56,164 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:56,164 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1734/2067], cost time 1.2136s, every example cost time is 1.2136, generate speed: 6.5917 tokens/s, avg speed: 10.2431 tokens/s, remaining time: 0:07:34 +pred is: + ['1'] + label is: + ['itself'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:27:56,248 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:56,248 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:56,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:56,249 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:56,249 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:57,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,817 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5675609111785889 s; generated tokens: 20 tokens; generate speed: 12.758674867034525 tokens/s +2024-07-30 14:27:57,822 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:57,822 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1735/2067], cost time 1.5795s, every example cost time is 1.5795, generate speed: 12.6622 tokens/s, avg speed: 10.2448 tokens/s, remaining time: 0:07:33 +pred is: + ['primality'] + label is: + ['primality'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:27:57,907 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:57,907 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:57,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:57,908 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:57,908 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:27:58,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:58,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:58,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:58,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:58,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,115 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2068736553192139 s; generated tokens: 9 tokens; generate speed: 7.457284331572828 tokens/s +2024-07-30 14:27:59,120 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:27:59,120 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1736/2067], cost time 1.2187s, every example cost time is 1.2187, generate speed: 7.3852 tokens/s, avg speed: 10.2433 tokens/s, remaining time: 0:07:32 +pred is: + ['There are infinitely many prime numbers.'] + label is: + ['infinitely many'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:27:59,205 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:27:59,205 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 200, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:27:59,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:27:59,206 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:27:59,206 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:00,150 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1157617568969727 s; generated tokens: 6 tokens; generate speed: 5.377492070248495 tokens/s +2024-07-30 14:28:00,327 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:00,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1737/2067], cost time 1.1277s, every example cost time is 1.1277, generate speed: 5.3204 tokens/s, avg speed: 10.2409 tokens/s, remaining time: 0:07:30 +pred is: + ["Goldbach's conjecture"] + label is: + ["Goldbach's conjecture"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:00,411 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:00,411 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:00,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:00,412 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:00,412 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:01,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:01,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:01,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:01,424 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0115838050842285 s; generated tokens: 3 tokens; generate speed: 2.965646528663246 tokens/s +2024-07-30 14:28:01,429 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:01,429 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1738/2067], cost time 1.0236s, every example cost time is 1.0236, generate speed: 2.9308 tokens/s, avg speed: 10.2378 tokens/s, remaining time: 0:07:29 +pred is: + ['2'] + label is: + ['2'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:01,512 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:01,512 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 235, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:01,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:01,513 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:01,513 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:02,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:02,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:02,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:02,525 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011564016342163 s; generated tokens: 3 tokens; generate speed: 2.965704544185017 tokens/s +2024-07-30 14:28:02,530 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:02,530 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1739/2067], cost time 1.0239s, every example cost time is 1.0239, generate speed: 2.9300 tokens/s, avg speed: 10.2346 tokens/s, remaining time: 0:07:27 +pred is: + ['1'] + label is: + ['1'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:02,642 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:02,642 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:02,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:02,643 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:02,643 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:03,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:03,851 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2075238227844238 s; generated tokens: 9 tokens; generate speed: 7.453269103417719 tokens/s +2024-07-30 14:28:03,856 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:03,856 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1740/2067], cost time 1.2194s, every example cost time is 1.2194, generate speed: 7.3805 tokens/s, avg speed: 10.2332 tokens/s, remaining time: 0:07:26 +pred is: + ['1'] + label is: + ["Euclid's fundamental theorem of arithmetic"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.8641639948048, Em score: 48.62068965517241, current_count: 1740 +2024-07-30 14:28:04,458 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:04,458 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:04,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:04,459 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:04,459 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:05,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:05,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:06,037 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.577918291091919 s; generated tokens: 20 tokens; generate speed: 12.674927537699057 tokens/s +2024-07-30 14:28:06,042 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:06,043 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1741/2067], cost time 1.5899s, every example cost time is 1.5899, generate speed: 12.5796 tokens/s, avg speed: 10.2347 tokens/s, remaining time: 0:07:25 +pred is: + ['Rhind papyrus'] + label is: + ['the Rhind papyrus'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:28:06,126 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:06,126 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:06,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:06,127 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:06,127 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:07,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,699 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5711350440979004 s; generated tokens: 20 tokens; generate speed: 12.729650500211083 tokens/s +2024-07-30 14:28:07,704 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:07,704 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1742/2067], cost time 1.5829s, every example cost time is 1.5829, generate speed: 12.6354 tokens/s, avg speed: 10.2363 tokens/s, remaining time: 0:07:23 +pred is: + ['1640'] + label is: + ['In 1640'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:28:07,788 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:07,788 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:07,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:07,789 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:07,789 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:08,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:08,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:09,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:09,354 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5646536350250244 s; generated tokens: 20 tokens; generate speed: 12.782381705635528 tokens/s +2024-07-30 14:28:09,359 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:09,359 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1743/2067], cost time 1.5768s, every example cost time is 1.5768, generate speed: 12.6840 tokens/s, avg speed: 10.2380 tokens/s, remaining time: 0:07:22 +pred is: + ['Trial division'] + label is: + ['trial division'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:09,443 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:09,444 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 275, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:09,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:09,445 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:09,445 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:10,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:10,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:10,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:10,460 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0149598121643066 s; generated tokens: 3 tokens; generate speed: 2.9557820556488648 tokens/s +2024-07-30 14:28:10,465 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:10,465 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1744/2067], cost time 1.0269s, every example cost time is 1.0269, generate speed: 2.9213 tokens/s, avg speed: 10.2348 tokens/s, remaining time: 0:07:20 +pred is: + ['2'] + label is: + ['two main classes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:10,548 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:10,548 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 252, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:10,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:10,549 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:10,549 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:11,494 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,749 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:11,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:12,109 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.560093879699707 s; generated tokens: 20 tokens; generate speed: 12.819741337521098 tokens/s +2024-07-30 14:28:12,114 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:12,114 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1745/2067], cost time 1.5717s, every example cost time is 1.5717, generate speed: 12.7250 tokens/s, avg speed: 10.2365 tokens/s, remaining time: 0:07:19 +pred is: + ['1'] + label is: + ['the Fermat primality test,'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:12,197 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:12,197 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:12,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:12,198 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:12,198 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:13,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,271 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,444 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2456848621368408 s; generated tokens: 10 tokens; generate speed: 8.027712549100144 tokens/s +2024-07-30 14:28:13,449 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:13,450 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1746/2067], cost time 1.2571s, every example cost time is 1.2571, generate speed: 7.9549 tokens/s, avg speed: 10.2352 tokens/s, remaining time: 0:07:18 +pred is: + ['2p + 1 with p prime'] + label is: + ['2p + 1'] +The F1/Em of this example is: {'F1': 57.14285714285715, 'Em': 0.0} +2024-07-30 14:28:13,532 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:13,532 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:13,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:13,533 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:13,533 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:14,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:14,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:15,089 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5552330017089844 s; generated tokens: 20 tokens; generate speed: 12.859809416352912 tokens/s +2024-07-30 14:28:15,094 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:15,094 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1747/2067], cost time 1.5671s, every example cost time is 1.5671, generate speed: 12.7623 tokens/s, avg speed: 10.2369 tokens/s, remaining time: 0:07:16 +pred is: + ['Distributed computing'] + label is: + ['distributed computing'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:15,183 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:15,184 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:15,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:15,184 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:15,185 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:16,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:16,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:16,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:16,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:16,227 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.04249906539917 s; generated tokens: 4 tokens; generate speed: 3.8369338954451835 tokens/s +2024-07-30 14:28:16,232 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:16,232 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1748/2067], cost time 1.0542s, every example cost time is 1.0542, generate speed: 3.7945 tokens/s, avg speed: 10.2341 tokens/s, remaining time: 0:07:15 +pred is: + ['Floor function'] + label is: + ['the floor function'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:28:16,315 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:16,315 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 240, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:16,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:16,315 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:16,316 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:17,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,866 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5499377250671387 s; generated tokens: 20 tokens; generate speed: 12.903744245036464 tokens/s +2024-07-30 14:28:17,871 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:17,871 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1749/2067], cost time 1.5614s, every example cost time is 1.5614, generate speed: 12.8088 tokens/s, avg speed: 10.2357 tokens/s, remaining time: 0:07:14 +pred is: + ['a and q must be relatively prime'] + label is: + ['their greatest common divisor is one'] +The F1/Em of this example is: {'F1': 8.333333333333334, 'Em': 0.0} +2024-07-30 14:28:17,962 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:17,962 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:17,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:17,963 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:17,963 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:18,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:18,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:18,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,101 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:19,513 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5497148036956787 s; generated tokens: 20 tokens; generate speed: 12.905600406155408 tokens/s +2024-07-30 14:28:19,518 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:19,518 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1750/2067], cost time 1.5615s, every example cost time is 1.5615, generate speed: 12.8078 tokens/s, avg speed: 10.2374 tokens/s, remaining time: 0:07:12 +pred is: + ['1'] + label is: + ['The zeta function'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.77092659510659, Em score: 48.457142857142856, current_count: 1750 +2024-07-30 14:28:20,138 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:20,138 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:20,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:20,139 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:20,139 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:21,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,338 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,692 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5530846118927002 s; generated tokens: 20 tokens; generate speed: 12.877598455905481 tokens/s +2024-07-30 14:28:21,697 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:21,697 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1751/2067], cost time 1.5649s, every example cost time is 1.5649, generate speed: 12.7802 tokens/s, avg speed: 10.2391 tokens/s, remaining time: 0:07:11 +pred is: + ['1859'] + label is: + ['1859'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:21,780 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:21,781 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 270, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:21,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:21,781 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:21,781 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:22,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:22,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:22,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:22,795 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0135080814361572 s; generated tokens: 3 tokens; generate speed: 2.960015864648017 tokens/s +2024-07-30 14:28:22,800 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:22,800 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1752/2067], cost time 1.0247s, every example cost time is 1.0247, generate speed: 2.9276 tokens/s, avg speed: 10.2360 tokens/s, remaining time: 0:07:10 +pred is: + ['1'] + label is: + ["Goldbach's conjecture"] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:22,883 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:22,883 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:22,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:22,884 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:22,884 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:23,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:23,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:23,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:23,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:23,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:23,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:24,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:24,032 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1471831798553467 s; generated tokens: 7 tokens; generate speed: 6.101902575735691 tokens/s +2024-07-30 14:28:24,037 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:24,037 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1753/2067], cost time 1.1591s, every example cost time is 1.1591, generate speed: 6.0391 tokens/s, avg speed: 10.2339 tokens/s, remaining time: 0:07:08 +pred is: + ['twin prime conjecture'] + label is: + ['twin prime conjecture'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:24,120 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:24,120 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:24,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:24,121 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:24,121 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:25,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,671 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5501973628997803 s; generated tokens: 20 tokens; generate speed: 12.901583036232395 tokens/s +2024-07-30 14:28:25,676 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:25,676 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1754/2067], cost time 1.5619s, every example cost time is 1.5619, generate speed: 12.8053 tokens/s, avg speed: 10.2356 tokens/s, remaining time: 0:07:07 +pred is: + ['The theory of groups'] + label is: + ['number theory'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:28:25,760 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:25,760 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:25,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:25,761 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:25,761 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:26,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:26,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:26,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:26,775 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0134503841400146 s; generated tokens: 3 tokens; generate speed: 2.960184382924395 tokens/s +2024-07-30 14:28:26,779 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:26,780 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1755/2067], cost time 1.0251s, every example cost time is 1.0251, generate speed: 2.9265 tokens/s, avg speed: 10.2325 tokens/s, remaining time: 0:07:05 +pred is: + ['Recurring'] + label is: + ['a recurring decimal'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:28:26,863 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:26,864 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:26,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:26,864 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:26,864 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:27,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:27,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:27,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:27,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:27,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:27,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,433 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5679810047149658 s; generated tokens: 20 tokens; generate speed: 12.75525656233041 tokens/s +2024-07-30 14:28:28,438 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:28,438 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1756/2067], cost time 1.5800s, every example cost time is 1.5800, generate speed: 12.6586 tokens/s, avg speed: 10.2341 tokens/s, remaining time: 0:07:04 +pred is: + ['RSA'] + label is: + ['RSA'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:28,521 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:28,521 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 277, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:28,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:28,522 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:28,522 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:29,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,501 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,534 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:29,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:30,099 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.577024221420288 s; generated tokens: 20 tokens; generate speed: 12.68211339327924 tokens/s +2024-07-30 14:28:30,104 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:30,104 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1757/2067], cost time 1.5887s, every example cost time is 1.5887, generate speed: 12.5890 tokens/s, avg speed: 10.2356 tokens/s, remaining time: 0:07:03 +pred is: + ['1'] + label is: + ['cicadas'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:30,188 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:30,189 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:30,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:30,189 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:30,190 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:31,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,269 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,771 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5808556079864502 s; generated tokens: 20 tokens; generate speed: 12.65137682338628 tokens/s +2024-07-30 14:28:31,776 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:31,776 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1758/2067], cost time 1.5927s, every example cost time is 1.5927, generate speed: 12.5569 tokens/s, avg speed: 10.2372 tokens/s, remaining time: 0:07:01 +pred is: + ['minimality or indecomposability'] + label is: + ['indecomposability'] +The F1/Em of this example is: {'F1': 33.333333333333336, 'Em': 0.0} +2024-07-30 14:28:31,860 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:31,861 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:31,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:31,861 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:31,862 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:32,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:32,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:32,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:32,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:32,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:32,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,181 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3197009563446045 s; generated tokens: 12 tokens; generate speed: 9.092969086904656 tokens/s +2024-07-30 14:28:33,186 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:33,187 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1759/2067], cost time 1.3317s, every example cost time is 1.3317, generate speed: 9.0112 tokens/s, avg speed: 10.2365 tokens/s, remaining time: 0:07:00 +pred is: + ['commutative ring'] + label is: + ['commutative ring R'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:28:33,278 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:33,278 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:33,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:33,279 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:33,279 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:34,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,361 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0818629264831543 s; generated tokens: 5 tokens; generate speed: 4.621657584897244 tokens/s +2024-07-30 14:28:34,366 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:34,366 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1760/2067], cost time 1.0935s, every example cost time is 1.0935, generate speed: 4.5723 tokens/s, avg speed: 10.2339 tokens/s, remaining time: 0:06:59 +pred is: + ['Fundamental theorem of arithmetic'] + label is: + ['The fundamental theorem of arithmetic'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +F1 score: 62.73766375460409, Em score: 48.35227272727273, current_count: 1760 +2024-07-30 14:28:34,986 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:34,986 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:34,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:34,987 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:34,987 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:35,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:35,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,138 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1512517929077148 s; generated tokens: 7 tokens; generate speed: 6.080337979166235 tokens/s +2024-07-30 14:28:36,143 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:36,144 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1761/2067], cost time 1.1633s, every example cost time is 1.1633, generate speed: 6.0175 tokens/s, avg speed: 10.2319 tokens/s, remaining time: 0:06:57 +pred is: + ['1'] + label is: + ['In ring theory'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:36,226 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:36,227 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 182, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:36,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:36,227 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:36,228 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:37,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,800 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5720348358154297 s; generated tokens: 20 tokens; generate speed: 12.722364380446955 tokens/s +2024-07-30 14:28:37,805 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:37,806 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1762/2067], cost time 1.5847s, every example cost time is 1.5847, generate speed: 12.6205 tokens/s, avg speed: 10.2335 tokens/s, remaining time: 0:06:56 +pred is: + ['The spectrum of a ring'] + label is: + ['Prime ideals'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 14:28:37,899 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:37,899 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:37,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:37,900 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:37,900 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:38,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:38,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:38,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:38,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:38,948 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0478861331939697 s; generated tokens: 4 tokens; generate speed: 3.8172086386981294 tokens/s +2024-07-30 14:28:38,953 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:38,954 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1763/2067], cost time 1.0604s, every example cost time is 1.0604, generate speed: 3.7722 tokens/s, avg speed: 10.2306 tokens/s, remaining time: 0:06:55 +pred is: + ['1/p'] + label is: + ['norm gets smaller'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:39,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:39,038 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:39,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:39,039 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:39,039 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:39,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,114 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,216 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1764581203460693 s; generated tokens: 8 tokens; generate speed: 6.8000720651634445 tokens/s +2024-07-30 14:28:40,220 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:40,221 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1764/2067], cost time 1.1887s, every example cost time is 1.1887, generate speed: 6.7303 tokens/s, avg speed: 10.2289 tokens/s, remaining time: 0:06:53 +pred is: + ['Olivier Messiaen'] + label is: + ['Olivier Messiaen'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:40,306 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:40,306 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:40,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:40,307 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:40,307 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:41,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,416 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,882 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.574354648590088 s; generated tokens: 20 tokens; generate speed: 12.70361796683548 tokens/s +2024-07-30 14:28:41,887 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:41,887 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1765/2067], cost time 1.5863s, every example cost time is 1.5863, generate speed: 12.6083 tokens/s, avg speed: 10.2304 tokens/s, remaining time: 0:06:52 +pred is: + ['Swiss canton of Graubünden in the southeastern Swiss Alps'] + label is: + ['Swiss canton'] +The F1/Em of this example is: {'F1': 27.27272727272727, 'Em': 0.0} +2024-07-30 14:28:41,971 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:41,971 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 293, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:41,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:41,972 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:41,972 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:42,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:42,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:42,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,542 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5699968338012695 s; generated tokens: 20 tokens; generate speed: 12.738879193517917 tokens/s +2024-07-30 14:28:43,548 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:43,548 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1766/2067], cost time 1.5822s, every example cost time is 1.5822, generate speed: 12.6405 tokens/s, avg speed: 10.2320 tokens/s, remaining time: 0:06:50 +pred is: + ['Gaulish'] + label is: + ['Gaulish name Rēnos'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:28:43,632 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:43,632 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:43,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:43,633 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:43,633 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:44,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:44,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:45,215 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5817406177520752 s; generated tokens: 20 tokens; generate speed: 12.64429817097536 tokens/s +2024-07-30 14:28:45,220 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:45,221 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1767/2067], cost time 1.5942s, every example cost time is 1.5942, generate speed: 12.5453 tokens/s, avg speed: 10.2336 tokens/s, remaining time: 0:06:49 +pred is: + ['Rhine-kilometers'] + label is: + ['Rhine-kilometers'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:45,306 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:45,307 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:45,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:45,307 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:45,308 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:46,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,318 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,748 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4402062892913818 s; generated tokens: 16 tokens; generate speed: 11.109519600745813 tokens/s +2024-07-30 14:28:46,753 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:46,753 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1768/2067], cost time 1.4524s, every example cost time is 1.4524, generate speed: 11.0163 tokens/s, avg speed: 10.2340 tokens/s, remaining time: 0:06:48 +pred is: + ['North'] + label is: + ['north'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:46,838 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:46,838 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 186, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:46,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:46,839 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:46,839 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:47,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:47,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:47,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:47,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:47,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:47,921 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0814602375030518 s; generated tokens: 5 tokens; generate speed: 4.623378490127697 tokens/s +2024-07-30 14:28:47,926 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:47,926 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1769/2067], cost time 1.0941s, every example cost time is 1.0941, generate speed: 4.5698 tokens/s, avg speed: 10.2315 tokens/s, remaining time: 0:06:46 +pred is: + ['Lake Constance'] + label is: + ['Lake Constance'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:48,010 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:48,010 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:48,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:48,011 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:48,011 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:48,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:48,990 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,190 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:49,598 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5865612030029297 s; generated tokens: 20 tokens; generate speed: 12.605879913201854 tokens/s +2024-07-30 14:28:49,603 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:49,603 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1770/2067], cost time 1.5986s, every example cost time is 1.5986, generate speed: 12.5108 tokens/s, avg speed: 10.2330 tokens/s, remaining time: 0:06:45 +pred is: + ['Diepoldsau'] + label is: + ['Diepoldsau'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.70464836273593, Em score: 48.36158192090395, current_count: 1770 +2024-07-30 14:28:50,240 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:50,240 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:50,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:50,241 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:50,241 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:51,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:51,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:51,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:51,259 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0170893669128418 s; generated tokens: 3 tokens; generate speed: 2.949593317552676 tokens/s +2024-07-30 14:28:51,264 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:51,264 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1771/2067], cost time 1.0299s, every example cost time is 1.0299, generate speed: 2.9130 tokens/s, avg speed: 10.2298 tokens/s, remaining time: 0:06:44 +pred is: + ['3'] + label is: + ['three'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:28:51,349 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:51,350 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:51,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:51,350 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:51,351 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:52,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:52,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.585928201675415 s; generated tokens: 20 tokens; generate speed: 12.610911375982525 tokens/s +2024-07-30 14:28:52,942 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:52,943 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1772/2067], cost time 1.5991s, every example cost time is 1.5991, generate speed: 12.5069 tokens/s, avg speed: 10.2314 tokens/s, remaining time: 0:06:42 +pred is: + ['The cold water is denser than the warm water.'] + label is: + ['greater density of cold water'] +The F1/Em of this example is: {'F1': 29.629629629629626, 'Em': 0.0} +2024-07-30 14:28:53,028 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:53,029 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:53,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:53,030 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:53,030 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:53,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:54,010 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:54,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:54,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:54,081 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.050590991973877 s; generated tokens: 4 tokens; generate speed: 3.8073808271330205 tokens/s +2024-07-30 14:28:54,085 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:54,086 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1773/2067], cost time 1.0630s, every example cost time is 1.0630, generate speed: 3.7628 tokens/s, avg speed: 10.2285 tokens/s, remaining time: 0:06:41 +pred is: + ['Westward'] + label is: + ['westward'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:54,170 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:54,170 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:54,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:54,171 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:54,171 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:55,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:55,149 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:55,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:55,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:55,218 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0468592643737793 s; generated tokens: 4 tokens; generate speed: 3.8209529553074737 tokens/s +2024-07-30 14:28:55,223 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:55,223 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1774/2067], cost time 1.0587s, every example cost time is 1.0587, generate speed: 3.7782 tokens/s, avg speed: 10.2257 tokens/s, remaining time: 0:06:39 +pred is: + ['Basel'] + label is: + ['Basel'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:28:55,309 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:55,310 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:55,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:55,311 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:55,311 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:56,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,385 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,877 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5665028095245361 s; generated tokens: 20 tokens; generate speed: 12.767292773685089 tokens/s +2024-07-30 14:28:56,882 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:56,883 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1775/2067], cost time 1.5792s, every example cost time is 1.5792, generate speed: 12.6646 tokens/s, avg speed: 10.2273 tokens/s, remaining time: 0:06:38 +pred is: + ['19th'] + label is: + ['19th Century'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:28:56,967 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:56,968 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:56,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:56,968 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:56,969 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:57,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:57,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:57,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,280 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3109655380249023 s; generated tokens: 12 tokens; generate speed: 9.153558695432354 tokens/s +2024-07-30 14:28:58,285 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:58,285 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1776/2067], cost time 1.3229s, every example cost time is 1.3229, generate speed: 9.0713 tokens/s, avg speed: 10.2267 tokens/s, remaining time: 0:06:37 +pred is: + ['The Rhine encounters the Neckar in Germany.'] + label is: + ['Germany'] +The F1/Em of this example is: {'F1': 13.333333333333334, 'Em': 0.0} +2024-07-30 14:28:58,369 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:58,369 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:58,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:58,370 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:58,370 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:28:59,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,451 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0810203552246094 s; generated tokens: 5 tokens; generate speed: 4.625259807398468 tokens/s +2024-07-30 14:28:59,456 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:28:59,457 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1777/2067], cost time 1.0930s, every example cost time is 1.0930, generate speed: 4.5744 tokens/s, avg speed: 10.2241 tokens/s, remaining time: 0:06:35 +pred is: + ['The Rhine'] + label is: + ['Middle Rhine'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +2024-07-30 14:28:59,540 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:28:59,541 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:28:59,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:28:59,542 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:28:59,542 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:00,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,655 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:00,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:01,112 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5696208477020264 s; generated tokens: 20 tokens; generate speed: 12.741930657509181 tokens/s +2024-07-30 14:29:01,117 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:01,117 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1778/2067], cost time 1.5818s, every example cost time is 1.5818, generate speed: 12.6436 tokens/s, avg speed: 10.2257 tokens/s, remaining time: 0:06:34 +pred is: + ['Industry'] + label is: + ['plants and factories'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:01,200 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:01,200 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:01,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:01,201 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:01,201 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:02,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:02,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:02,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:02,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:02,247 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0465688705444336 s; generated tokens: 4 tokens; generate speed: 3.8220131637578403 tokens/s +2024-07-30 14:29:02,252 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:02,253 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1779/2067], cost time 1.0581s, every example cost time is 1.0581, generate speed: 3.7802 tokens/s, avg speed: 10.2229 tokens/s, remaining time: 0:06:33 +pred is: + ['tourism'] + label is: + ['tourism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:02,336 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:02,337 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:02,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:02,337 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:02,337 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:03,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:03,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:03,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:03,353 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.015317440032959 s; generated tokens: 3 tokens; generate speed: 2.95474093294666 tokens/s +2024-07-30 14:29:03,358 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:03,358 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1780/2067], cost time 1.0275s, every example cost time is 1.0275, generate speed: 2.9197 tokens/s, avg speed: 10.2198 tokens/s, remaining time: 0:06:31 +pred is: + ['Duisburg'] + label is: + ['Duisburg'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.666773725658565, Em score: 48.31460674157304, current_count: 1780 +2024-07-30 14:29:03,975 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:03,975 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 251, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:03,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:03,976 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:03,976 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:04,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:04,955 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:04,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:05,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:05,022 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0451703071594238 s; generated tokens: 4 tokens; generate speed: 3.827127476354784 tokens/s +2024-07-30 14:29:05,026 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:05,027 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1781/2067], cost time 1.0572s, every example cost time is 1.0572, generate speed: 3.7834 tokens/s, avg speed: 10.2170 tokens/s, remaining time: 0:06:30 +pred is: + ['Meuse'] + label is: + ['Meuse'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:05,109 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:05,110 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:05,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:05,110 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:05,110 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:06,054 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,088 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,283 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1719715595245361 s; generated tokens: 8 tokens; generate speed: 6.82610421301142 tokens/s +2024-07-30 14:29:06,288 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:06,288 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1782/2067], cost time 1.1838s, every example cost time is 1.1838, generate speed: 6.7579 tokens/s, avg speed: 10.2153 tokens/s, remaining time: 0:06:28 +pred is: + ['Pannerdens Kanaal'] + label is: + ['Pannerdens Kanaal'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:06,371 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:06,371 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:06,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:06,372 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:06,372 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:07,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,515 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1427550315856934 s; generated tokens: 7 tokens; generate speed: 6.12554730149537 tokens/s +2024-07-30 14:29:07,520 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:07,520 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1783/2067], cost time 1.1545s, every example cost time is 1.1545, generate speed: 6.0634 tokens/s, avg speed: 10.2133 tokens/s, remaining time: 0:06:27 +pred is: + ['Kromme Rijn'] + label is: + ['Rijn'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:29:07,604 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:07,604 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:07,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:07,605 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:07,605 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:08,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,783 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.177581787109375 s; generated tokens: 8 tokens; generate speed: 6.7935833311737115 tokens/s +2024-07-30 14:29:08,788 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:08,788 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1784/2067], cost time 1.1895s, every example cost time is 1.1895, generate speed: 6.7257 tokens/s, avg speed: 10.2116 tokens/s, remaining time: 0:06:26 +pred is: + ['Rhine-Meuse Delta'] + label is: + ['Rhine-Meuse'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:29:08,872 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:08,872 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 355, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:08,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:08,873 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:08,873 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:09,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:09,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:09,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:09,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:09,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:09,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,467 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.593724250793457 s; generated tokens: 20 tokens; generate speed: 12.54922235765863 tokens/s +2024-07-30 14:29:10,473 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:10,473 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1785/2067], cost time 1.6065s, every example cost time is 1.6065, generate speed: 12.4497 tokens/s, avg speed: 10.2131 tokens/s, remaining time: 0:06:24 +pred is: + ['Waal'] + label is: + ['Nederrijn at Angeren'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:10,558 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:10,559 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:10,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:10,560 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:10,560 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:11,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:11,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:12,131 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5706913471221924 s; generated tokens: 20 tokens; generate speed: 12.733246437400851 tokens/s +2024-07-30 14:29:12,136 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:12,136 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1786/2067], cost time 1.5830s, every example cost time is 1.5830, generate speed: 12.6341 tokens/s, avg speed: 10.2147 tokens/s, remaining time: 0:06:23 +pred is: + ["St. Elizabeth's flood"] + label is: + ["St. Elizabeth's"] +The F1/Em of this example is: {'F1': 85.71428571428571, 'Em': 0.0} +2024-07-30 14:29:12,219 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:12,220 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:12,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:12,220 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:12,221 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:13,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,262 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,787 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5663256645202637 s; generated tokens: 20 tokens; generate speed: 12.768736702099321 tokens/s +2024-07-30 14:29:13,792 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:13,792 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1787/2067], cost time 1.5780s, every example cost time is 1.5780, generate speed: 12.6741 tokens/s, avg speed: 10.2163 tokens/s, remaining time: 0:06:22 +pred is: + ['drainage channels for the numerous polders'] + label is: + ['drainage channels'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 14:29:13,881 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:13,882 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:13,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:13,882 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:13,883 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:14,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:14,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:14,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:14,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:14,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:14,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0864691734313965 s; generated tokens: 5 tokens; generate speed: 4.602063383177726 tokens/s +2024-07-30 14:29:14,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:14,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1788/2067], cost time 1.0983s, every example cost time is 1.0983, generate speed: 4.5527 tokens/s, avg speed: 10.2137 tokens/s, remaining time: 0:06:20 +pred is: + ['Tidal Delta'] + label is: + ['tidal delta'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:15,059 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:15,060 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 266, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:15,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:15,060 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:15,061 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:16,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,207 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,273 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,343 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2820956707000732 s; generated tokens: 11 tokens; generate speed: 8.579702943691855 tokens/s +2024-07-30 14:29:16,348 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:16,348 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1789/2067], cost time 1.2944s, every example cost time is 1.2944, generate speed: 8.4983 tokens/s, avg speed: 10.2128 tokens/s, remaining time: 0:06:19 +pred is: + ['Tethys'] + label is: + ['Tethys sea'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:29:16,434 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:16,434 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:16,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:16,435 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:16,435 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:17,380 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,554 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:17,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:18,019 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5835981369018555 s; generated tokens: 20 tokens; generate speed: 12.629466740298087 tokens/s +2024-07-30 14:29:18,024 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:18,024 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1790/2067], cost time 1.5958s, every example cost time is 1.5958, generate speed: 12.5326 tokens/s, avg speed: 10.2143 tokens/s, remaining time: 0:06:18 +pred is: + ['Upper Rhine Graben'] + label is: + ['N–S'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.63990427946573, Em score: 48.212290502793294, current_count: 1790 +2024-07-30 14:29:18,671 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:18,672 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:18,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:18,672 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:18,673 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:19,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:19,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:20,260 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5871574878692627 s; generated tokens: 20 tokens; generate speed: 12.60114396514597 tokens/s +2024-07-30 14:29:20,265 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:20,265 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1791/2067], cost time 1.5993s, every example cost time is 1.5993, generate speed: 12.5056 tokens/s, avg speed: 10.2158 tokens/s, remaining time: 0:06:16 +pred is: + ['Through stream capture'] + label is: + ['stream capture'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:29:20,349 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:20,349 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 268, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:20,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:20,350 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:20,350 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:21,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,523 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,588 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:21,946 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5957365036010742 s; generated tokens: 20 tokens; generate speed: 12.53339755960104 tokens/s +2024-07-30 14:29:21,951 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:21,952 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1792/2067], cost time 1.6078s, every example cost time is 1.6078, generate speed: 12.4395 tokens/s, avg speed: 10.2173 tokens/s, remaining time: 0:06:15 +pred is: + ['Pleistocene'] + label is: + ['Ice Ages'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:22,035 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:22,035 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:22,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:22,036 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:22,036 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:22,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,146 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1099505424499512 s; generated tokens: 6 tokens; generate speed: 5.405646261279742 tokens/s +2024-07-30 14:29:23,151 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:23,152 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1793/2067], cost time 1.1219s, every example cost time is 1.1219, generate speed: 5.3482 tokens/s, avg speed: 10.2151 tokens/s, remaining time: 0:06:13 +pred is: + ['74,000 BP'] + label is: + ['74,000 (BP'] +The F1/Em of this example is: {'F1': 72.72727272727272, 'Em': 0.0} +2024-07-30 14:29:23,235 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:23,235 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:23,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:23,236 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:23,236 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:24,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,804 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.567479133605957 s; generated tokens: 20 tokens; generate speed: 12.759340504897418 tokens/s +2024-07-30 14:29:24,808 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:24,809 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1794/2067], cost time 1.5796s, every example cost time is 1.5796, generate speed: 12.6616 tokens/s, avg speed: 10.2166 tokens/s, remaining time: 0:06:12 +pred is: + ['1'] + label is: + ['glacier'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:24,892 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:24,892 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:24,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:24,893 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:24,893 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:25,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:25,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:25,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:25,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:25,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,484 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5907902717590332 s; generated tokens: 20 tokens; generate speed: 12.572367555331343 tokens/s +2024-07-30 14:29:26,489 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:26,490 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1795/2067], cost time 1.6026s, every example cost time is 1.6026, generate speed: 12.4795 tokens/s, avg speed: 10.2181 tokens/s, remaining time: 0:06:11 +pred is: + ['22,000 years ago'] + label is: + ['22,000 years ago'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:26,574 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:26,574 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 181, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:26,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:26,575 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:26,575 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:27,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:27,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:28,153 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5778050422668457 s; generated tokens: 20 tokens; generate speed: 12.675837295630538 tokens/s +2024-07-30 14:29:28,158 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:28,158 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1796/2067], cost time 1.5896s, every example cost time is 1.5896, generate speed: 12.5816 tokens/s, avg speed: 10.2196 tokens/s, remaining time: 0:06:09 +pred is: + ['7500 years ago'] + label is: + ['7500 yr ago'] +The F1/Em of this example is: {'F1': 40.00000000000001, 'Em': 0.0} +2024-07-30 14:29:28,241 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:28,241 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:28,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:28,242 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:28,242 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:29,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,219 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,251 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,616 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.373784065246582 s; generated tokens: 14 tokens; generate speed: 10.190830097805163 tokens/s +2024-07-30 14:29:29,621 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:29,621 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1797/2067], cost time 1.3858s, every example cost time is 1.3858, generate speed: 10.1022 tokens/s, avg speed: 10.2196 tokens/s, remaining time: 0:06:08 +pred is: + ['11,700 years ago'] + label is: + ['11,700 years ago'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:29,707 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:29,707 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:29,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:29,708 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:29,708 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:30,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:30,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:31,050 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3416168689727783 s; generated tokens: 13 tokens; generate speed: 9.689800643274241 tokens/s +2024-07-30 14:29:31,055 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:31,055 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1798/2067], cost time 1.3546s, every example cost time is 1.3546, generate speed: 9.5970 tokens/s, avg speed: 10.2192 tokens/s, remaining time: 0:06:07 +pred is: + ['Since ~3000 yr BP (= years Before Present)'] + label is: + ['3000 yr BP'] +The F1/Em of this example is: {'F1': 47.61904761904761, 'Em': 0.0} +2024-07-30 14:29:31,139 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:31,139 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:31,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:31,140 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:31,140 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:32,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,741 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.6004042625427246 s; generated tokens: 20 tokens; generate speed: 12.496842496672667 tokens/s +2024-07-30 14:29:32,747 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:32,747 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1799/2067], cost time 1.6136s, every example cost time is 1.6136, generate speed: 12.3943 tokens/s, avg speed: 10.2207 tokens/s, remaining time: 0:06:05 +pred is: + ['The North Sea'] + label is: + ['North Sea'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:29:32,834 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:32,834 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:32,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:32,835 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:32,835 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:33,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:33,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:34,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:34,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:34,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:34,420 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.584855318069458 s; generated tokens: 20 tokens; generate speed: 12.619448458148455 tokens/s +2024-07-30 14:29:34,426 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:34,427 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1800/2067], cost time 1.5999s, every example cost time is 1.5999, generate speed: 12.5005 tokens/s, avg speed: 10.2221 tokens/s, remaining time: 0:06:04 +pred is: + ['1st century BC'] + label is: + ['1st century BC'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.63098610032777, Em score: 48.111111111111114, current_count: 1800 +2024-07-30 14:29:35,083 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:35,083 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 231, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:35,084 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:35,084 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:35,084 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:36,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,126 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,670 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5852234363555908 s; generated tokens: 20 tokens; generate speed: 12.616517988139107 tokens/s +2024-07-30 14:29:36,675 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:36,675 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1801/2067], cost time 1.5974s, every example cost time is 1.5974, generate speed: 12.5203 tokens/s, avg speed: 10.2236 tokens/s, remaining time: 0:06:03 +pred is: + ['AD 14'] + label is: + ['AD 14'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:36,758 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:36,758 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:36,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:36,759 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:36,759 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:37,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:37,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:37,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:37,778 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0189392566680908 s; generated tokens: 3 tokens; generate speed: 2.9442383148627864 tokens/s +2024-07-30 14:29:37,783 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:37,783 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1802/2067], cost time 1.0307s, every example cost time is 1.0307, generate speed: 2.9107 tokens/s, avg speed: 10.2206 tokens/s, remaining time: 0:06:01 +pred is: + ['8'] + label is: + ['eight'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:37,866 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:37,867 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:37,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:37,868 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:37,868 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:38,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:38,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:38,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:38,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:38,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:38,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,041 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,372 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.503755807876587 s; generated tokens: 18 tokens; generate speed: 11.97002858158022 tokens/s +2024-07-30 14:29:39,377 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:39,377 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1803/2067], cost time 1.5156s, every example cost time is 1.5156, generate speed: 11.8766 tokens/s, avg speed: 10.2216 tokens/s, remaining time: 0:06:00 +pred is: + ['5th century'] + label is: + ['5th century'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:39,489 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:39,489 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 248, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:39,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:39,491 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:39,491 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:40,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,537 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:40,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:41,092 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.6004002094268799 s; generated tokens: 20 tokens; generate speed: 12.496874145725219 tokens/s +2024-07-30 14:29:41,096 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:41,097 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1804/2067], cost time 1.6152s, every example cost time is 1.6152, generate speed: 12.3823 tokens/s, avg speed: 10.2230 tokens/s, remaining time: 0:05:59 +pred is: + ['6th century'] + label is: + ['6th century'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:41,181 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:41,182 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 241, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:41,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:41,183 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:41,183 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:42,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,293 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,357 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,751 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5677838325500488 s; generated tokens: 20 tokens; generate speed: 12.756860725798774 tokens/s +2024-07-30 14:29:42,756 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:42,756 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1805/2067], cost time 1.5798s, every example cost time is 1.5798, generate speed: 12.6599 tokens/s, avg speed: 10.2246 tokens/s, remaining time: 0:05:57 +pred is: + ['Peace of Westphalia'] + label is: + ['Peace of Westphalia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:42,839 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:42,840 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:42,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:42,840 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:42,841 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:43,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:43,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:43,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:43,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:43,890 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0493395328521729 s; generated tokens: 4 tokens; generate speed: 3.811921570445117 tokens/s +2024-07-30 14:29:43,895 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:43,895 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1806/2067], cost time 1.0615s, every example cost time is 1.0615, generate speed: 3.7683 tokens/s, avg speed: 10.2218 tokens/s, remaining time: 0:05:56 +pred is: + ['1919'] + label is: + ['end of World War I'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:43,978 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:43,979 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:43,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:43,980 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:43,980 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:44,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:44,959 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:44,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:45,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:45,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:45,061 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.08064866065979 s; generated tokens: 5 tokens; generate speed: 4.626850688869822 tokens/s +2024-07-30 14:29:45,065 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:45,066 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1807/2067], cost time 1.0925s, every example cost time is 1.0925, generate speed: 4.5769 tokens/s, avg speed: 10.2193 tokens/s, remaining time: 0:05:55 +pred is: + ['Arnhem'] + label is: + ['Arnhem'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:45,172 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:45,173 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:45,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:45,173 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:45,173 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:46,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,412 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,482 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3080179691314697 s; generated tokens: 12 tokens; generate speed: 9.174185892849819 tokens/s +2024-07-30 14:29:46,486 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:46,487 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1808/2067], cost time 1.3199s, every example cost time is 1.3199, generate speed: 9.0916 tokens/s, avg speed: 10.2187 tokens/s, remaining time: 0:05:53 +pred is: + ['1,230'] + label is: + ['1,230 kilometres (764 miles)'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 14:29:46,570 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:46,570 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:46,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:46,571 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:46,571 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:47,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:47,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:48,014 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.442521333694458 s; generated tokens: 16 tokens; generate speed: 11.0916903800807 tokens/s +2024-07-30 14:29:48,019 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:48,019 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1809/2067], cost time 1.4543s, every example cost time is 1.4543, generate speed: 11.0018 tokens/s, avg speed: 10.2192 tokens/s, remaining time: 0:05:52 +pred is: + ['1999'] + label is: + ['Following a referendum in 1997'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:29:48,104 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:48,104 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 242, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:48,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:48,105 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:48,105 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:49,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,245 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:49,713 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.6073195934295654 s; generated tokens: 20 tokens; generate speed: 12.443076088760703 tokens/s +2024-07-30 14:29:49,717 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:49,718 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1810/2067], cost time 1.6191s, every example cost time is 1.6191, generate speed: 12.3527 tokens/s, avg speed: 10.2205 tokens/s, remaining time: 0:05:50 +pred is: + ['The lack of a Parliament of Scotland'] + label is: + ['lack of a Parliament of Scotland'] +The F1/Em of this example is: {'F1': 91.66666666666666, 'Em': 0.0} +F1 score: 62.635524193433035, Em score: 48.12154696132597, current_count: 1810 +2024-07-30 14:29:50,342 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:50,342 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:50,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:50,343 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:50,343 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:51,287 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:51,911 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.567194938659668 s; generated tokens: 20 tokens; generate speed: 12.761654282207454 tokens/s +2024-07-30 14:29:51,915 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:51,916 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1811/2067], cost time 1.5793s, every example cost time is 1.5793, generate speed: 12.6634 tokens/s, avg speed: 10.2221 tokens/s, remaining time: 0:05:49 +pred is: + ['North Sea'] + label is: + ['North'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:29:52,000 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:52,001 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:52,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:52,001 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:52,001 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:52,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:52,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,143 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,177 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,576 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5739367008209229 s; generated tokens: 20 tokens; generate speed: 12.706991322820379 tokens/s +2024-07-30 14:29:53,580 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:53,581 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1812/2067], cost time 1.5857s, every example cost time is 1.5857, generate speed: 12.6125 tokens/s, avg speed: 10.2236 tokens/s, remaining time: 0:05:48 +pred is: + ['Edinburgh'] + label is: + ['Edinburgh'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:29:53,665 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:53,665 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:53,666 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:53,666 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:53,666 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:54,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:54,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:55,231 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5645439624786377 s; generated tokens: 20 tokens; generate speed: 12.78327773437244 tokens/s +2024-07-30 14:29:55,236 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:55,236 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1813/2067], cost time 1.5766s, every example cost time is 1.5766, generate speed: 12.6853 tokens/s, avg speed: 10.2252 tokens/s, remaining time: 0:05:46 +pred is: + ['Demand for a Scottish Parliament grew'] + label is: + ['a Scottish Parliament'] +The F1/Em of this example is: {'F1': 62.5, 'Em': 0.0} +2024-07-30 14:29:55,321 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:55,322 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:55,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:55,322 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:55,322 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:56,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,431 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,898 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5754568576812744 s; generated tokens: 20 tokens; generate speed: 12.69473035868186 tokens/s +2024-07-30 14:29:56,903 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:56,903 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1814/2067], cost time 1.5873s, every example cost time is 1.5873, generate speed: 12.6001 tokens/s, avg speed: 10.2267 tokens/s, remaining time: 0:05:45 +pred is: + ['In the Holyrood area of Edinburgh'] + label is: + ['Scottish Parliament Building'] +The F1/Em of this example is: {'F1': 12.500000000000004, 'Em': 0.0} +2024-07-30 14:29:56,987 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:56,988 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:56,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:56,988 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:56,988 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:57,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:57,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:57,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,127 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,163 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1743087768554688 s; generated tokens: 8 tokens; generate speed: 6.8125182725979245 tokens/s +2024-07-30 14:29:58,168 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:58,168 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1815/2067], cost time 1.1861s, every example cost time is 1.1861, generate speed: 6.7450 tokens/s, avg speed: 10.2251 tokens/s, remaining time: 0:05:44 +pred is: + ["The Church's General Assembly Hall"] + label is: + ["meeting of the Church's General Assembly"] +The F1/Em of this example is: {'F1': 75.00000000000001, 'Em': 0.0} +2024-07-30 14:29:58,252 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:58,252 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:58,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:58,253 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:58,253 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:29:59,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,231 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,464 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,831 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5774288177490234 s; generated tokens: 20 tokens; generate speed: 12.678860545060802 tokens/s +2024-07-30 14:29:59,836 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:29:59,836 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1816/2067], cost time 1.5898s, every example cost time is 1.5898, generate speed: 12.5804 tokens/s, avg speed: 10.2266 tokens/s, remaining time: 0:05:42 +pred is: + ['The City of Edinburgh Council'] + label is: + ['City of Edinburgh Council'] +The F1/Em of this example is: {'F1': 87.50000000000001, 'Em': 0.0} +2024-07-30 14:29:59,926 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:29:59,927 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:29:59,928 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:29:59,928 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:29:59,928 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:00,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:00,907 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:00,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:00,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,035 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,500 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5713543891906738 s; generated tokens: 20 tokens; generate speed: 12.727873570455994 tokens/s +2024-07-30 14:30:01,504 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:01,505 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1817/2067], cost time 1.5835s, every example cost time is 1.5835, generate speed: 12.6305 tokens/s, avg speed: 10.2281 tokens/s, remaining time: 0:05:41 +pred is: + ['Presiding Officer'] + label is: + ['one MSP'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:30:01,589 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:01,589 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:01,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:01,590 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:01,590 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:02,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:02,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:03,178 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.587174654006958 s; generated tokens: 20 tokens; generate speed: 12.601007677074662 tokens/s +2024-07-30 14:30:03,183 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:03,183 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1818/2067], cost time 1.5990s, every example cost time is 1.5990, generate speed: 12.5078 tokens/s, avg speed: 10.2296 tokens/s, remaining time: 0:05:40 +pred is: + ['1'] + label is: + ['Presiding Officer'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:03,266 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:03,267 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:03,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:03,267 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:03,268 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:04,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,450 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,844 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5758798122406006 s; generated tokens: 20 tokens; generate speed: 12.691323186356334 tokens/s +2024-07-30 14:30:04,849 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:04,849 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1819/2067], cost time 1.5881s, every example cost time is 1.5881, generate speed: 12.5939 tokens/s, avg speed: 10.2311 tokens/s, remaining time: 0:05:38 +pred is: + ['The debating chamber of the Scottish Parliament has seating arranged in a hemicycle, which reflects the desire'] + label is: + ['hemicycle'] +The F1/Em of this example is: {'F1': 5.714285714285714, 'Em': 0.0} +2024-07-30 14:30:04,935 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:04,935 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:04,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:04,936 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:04,936 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:05,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:05,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:05,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:05,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:06,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:06,014 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0778379440307617 s; generated tokens: 5 tokens; generate speed: 4.63891629320604 tokens/s +2024-07-30 14:30:06,019 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:06,019 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1820/2067], cost time 1.0902s, every example cost time is 1.0902, generate speed: 4.5862 tokens/s, avg speed: 10.2286 tokens/s, remaining time: 0:05:37 +pred is: + ['Scottish rivers'] + label is: + ['Scottish rivers'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.58068484019858, Em score: 47.967032967032964, current_count: 1820 +2024-07-30 14:30:06,649 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:06,650 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:06,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:06,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:06,651 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:07,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,763 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,829 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,833 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1822524070739746 s; generated tokens: 8 tokens; generate speed: 6.766744522685867 tokens/s +2024-07-30 14:30:07,838 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:07,838 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1821/2067], cost time 1.1945s, every example cost time is 1.1945, generate speed: 6.6976 tokens/s, avg speed: 10.2269 tokens/s, remaining time: 0:05:36 +pred is: + ['4'] + label is: + ['April'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:07,922 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:07,922 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:07,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:07,923 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:07,923 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:08,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:08,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:08,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:08,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0137133598327637 s; generated tokens: 3 tokens; generate speed: 2.959416457227043 tokens/s +2024-07-30 14:30:08,942 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:08,942 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1822/2067], cost time 1.0258s, every example cost time is 1.0258, generate speed: 2.9245 tokens/s, avg speed: 10.2239 tokens/s, remaining time: 0:05:34 +pred is: + ['Wednesday'] + label is: + ['Wednesdays'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:09,025 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:09,026 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:09,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:09,027 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:09,027 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:09,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,105 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,477 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4500367641448975 s; generated tokens: 16 tokens; generate speed: 11.03420299100856 tokens/s +2024-07-30 14:30:10,482 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:10,482 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1823/2067], cost time 1.4621s, every example cost time is 1.4621, generate speed: 10.9429 tokens/s, avg speed: 10.2243 tokens/s, remaining time: 0:05:33 +pred is: + ['The Presiding Officer (or Deputy Presiding Officer)'] + label is: + ['The Presiding Officer'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:30:10,567 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:10,568 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:10,568 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:10,568 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:10,569 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:11,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:11,548 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:11,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:11,614 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:11,617 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0480906963348389 s; generated tokens: 4 tokens; generate speed: 3.81646360757514 tokens/s +2024-07-30 14:30:11,622 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:11,622 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1824/2067], cost time 1.0600s, every example cost time is 1.0600, generate speed: 3.7736 tokens/s, avg speed: 10.2216 tokens/s, remaining time: 0:05:31 +pred is: + ['5 pm'] + label is: + ['5 pm'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:11,706 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:11,707 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 216, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:11,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:11,707 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:11,707 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:12,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,750 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:12,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:13,276 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5680410861968994 s; generated tokens: 20 tokens; generate speed: 12.754767828506116 tokens/s +2024-07-30 14:30:13,280 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:13,281 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1825/2067], cost time 1.5804s, every example cost time is 1.5804, generate speed: 12.6554 tokens/s, avg speed: 10.2231 tokens/s, remaining time: 0:05:30 +pred is: + ['1'] + label is: + ['votes'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:13,365 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:13,366 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:13,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:13,366 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:13,366 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:14,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,485 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1187646389007568 s; generated tokens: 6 tokens; generate speed: 5.363058315728772 tokens/s +2024-07-30 14:30:14,490 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:14,490 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1826/2067], cost time 1.1307s, every example cost time is 1.1307, generate speed: 5.3064 tokens/s, avg speed: 10.2209 tokens/s, remaining time: 0:05:29 +pred is: + ['Immediately after Decision Time'] + label is: + ['Immediately after Decision Time'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:14,575 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:14,575 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:14,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:14,576 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:14,576 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:15,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:15,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:16,138 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5611896514892578 s; generated tokens: 20 tokens; generate speed: 12.81074338464997 tokens/s +2024-07-30 14:30:16,143 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:16,143 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1827/2067], cost time 1.5734s, every example cost time is 1.5734, generate speed: 12.7112 tokens/s, avg speed: 10.2225 tokens/s, remaining time: 0:05:27 +pred is: + ['1'] + label is: + ['committee'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:16,226 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:16,226 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:16,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:16,227 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:16,227 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:17,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,238 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,479 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,811 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5837781429290771 s; generated tokens: 20 tokens; generate speed: 12.628031324520947 tokens/s +2024-07-30 14:30:17,816 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:17,817 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1828/2067], cost time 1.5957s, every example cost time is 1.5957, generate speed: 12.5335 tokens/s, avg speed: 10.2239 tokens/s, remaining time: 0:05:26 +pred is: + ['MSPs'] + label is: + ['a small number of MSPs'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:30:17,901 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:17,902 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 142, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:17,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:17,902 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:17,903 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:18,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:18,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:18,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:18,943 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:18,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,461 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5585813522338867 s; generated tokens: 20 tokens; generate speed: 12.832182273536352 tokens/s +2024-07-30 14:30:19,466 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:19,467 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1829/2067], cost time 1.5704s, every example cost time is 1.5704, generate speed: 12.7357 tokens/s, avg speed: 10.2255 tokens/s, remaining time: 0:05:25 +pred is: + ['at the beginning of each parliamentary session'] + label is: + ['beginning of each parliamentary session'] +The F1/Em of this example is: {'F1': 81.81818181818181, 'Em': 0.0} +2024-07-30 14:30:19,550 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:19,551 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 159, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:19,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:19,552 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:19,552 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:20,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:20,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:20,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:20,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:20,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:20,632 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0800690650939941 s; generated tokens: 5 tokens; generate speed: 4.629333587630223 tokens/s +2024-07-30 14:30:20,637 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:20,637 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1830/2067], cost time 1.0921s, every example cost time is 1.0921, generate speed: 4.5782 tokens/s, avg speed: 10.2231 tokens/s, remaining time: 0:05:23 +pred is: + ['Private Bill Committees'] + label is: + ['type of committee'] +The F1/Em of this example is: {'F1': 20.000000000000004, 'Em': 0.0} +F1 score: 62.44189321911453, Em score: 47.814207650273225, current_count: 1830 +2024-07-30 14:30:21,266 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:21,266 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 248, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:21,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:21,267 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:21,267 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:22,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,452 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,713 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4454119205474854 s; generated tokens: 16 tokens; generate speed: 11.069508817901271 tokens/s +2024-07-30 14:30:22,718 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:22,718 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1831/2067], cost time 1.4573s, every example cost time is 1.4573, generate speed: 10.9791 tokens/s, avg speed: 10.2235 tokens/s, remaining time: 0:05:22 +pred is: + ['The Scotland Act 1998'] + label is: + ['Scotland Act 1998'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:30:22,802 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:22,802 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:22,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:22,803 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:22,803 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:23,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:23,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:24,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:24,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:24,144 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3401601314544678 s; generated tokens: 13 tokens; generate speed: 9.700333336950695 tokens/s +2024-07-30 14:30:24,149 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:24,149 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1832/2067], cost time 1.3522s, every example cost time is 1.3522, generate speed: 9.6142 tokens/s, avg speed: 10.2232 tokens/s, remaining time: 0:05:21 +pred is: + ['Schedule 5 to the Scotland Act'] + label is: + ['Schedule 5'] +The F1/Em of this example is: {'F1': 42.857142857142854, 'Em': 0.0} +2024-07-30 14:30:24,233 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:24,233 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 180, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:24,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:24,234 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:24,234 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:25,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:25,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:25,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:25,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:25,280 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0451221466064453 s; generated tokens: 4 tokens; generate speed: 3.827303835238938 tokens/s +2024-07-30 14:30:25,284 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:25,285 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1833/2067], cost time 1.0569s, every example cost time is 1.0569, generate speed: 3.7848 tokens/s, avg speed: 10.2204 tokens/s, remaining time: 0:05:19 +pred is: + ['Reserved matters'] + label is: + ['Reserved'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:30:25,368 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:25,368 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:25,369 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:25,369 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:25,369 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:26,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:26,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:26,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:26,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:26,414 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0448577404022217 s; generated tokens: 4 tokens; generate speed: 3.828272352617291 tokens/s +2024-07-30 14:30:26,419 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:26,419 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1834/2067], cost time 1.0566s, every example cost time is 1.0566, generate speed: 3.7857 tokens/s, avg speed: 10.2177 tokens/s, remaining time: 0:05:18 +pred is: + ['A bill'] + label is: + ['Bills'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:26,502 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:26,503 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:26,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:26,503 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:26,504 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:27,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:27,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:28,073 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5695664882659912 s; generated tokens: 20 tokens; generate speed: 12.742371953987998 tokens/s +2024-07-30 14:30:28,078 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:28,079 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1835/2067], cost time 1.5813s, every example cost time is 1.5813, generate speed: 12.6475 tokens/s, avg speed: 10.2193 tokens/s, remaining time: 0:05:16 +pred is: + ['The first, or introductory stage of the bill, where the minister or member in charge of the'] + label is: + ['introductory'] +The F1/Em of this example is: {'F1': 5.555555555555556, 'Em': 0.0} +2024-07-30 14:30:28,163 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:28,164 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:28,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:28,164 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:28,164 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:29,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,244 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0794222354888916 s; generated tokens: 5 tokens; generate speed: 4.632107655013612 tokens/s +2024-07-30 14:30:29,249 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:29,249 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1836/2067], cost time 1.0913s, every example cost time is 1.0913, generate speed: 4.5816 tokens/s, avg speed: 10.2168 tokens/s, remaining time: 0:05:15 +pred is: + ['Stage 3'] + label is: + ['Stage 3'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:29,332 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:29,333 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:29,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:29,333 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:29,334 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:30,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,413 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.07938814163208 s; generated tokens: 5 tokens; generate speed: 4.632253966066174 tokens/s +2024-07-30 14:30:30,418 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:30,418 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1837/2067], cost time 1.0909s, every example cost time is 1.0909, generate speed: 4.5832 tokens/s, avg speed: 10.2144 tokens/s, remaining time: 0:05:14 +pred is: + ['The Monarch'] + label is: + ['the Monarch'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:30,502 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:30,502 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 266, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:30,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:30,503 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:30,503 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:31,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:31,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:32,032 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5289907455444336 s; generated tokens: 19 tokens; generate speed: 12.42649771123016 tokens/s +2024-07-30 14:30:32,037 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:32,037 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1838/2067], cost time 1.5408s, every example cost time is 1.5408, generate speed: 12.3315 tokens/s, avg speed: 10.2157 tokens/s, remaining time: 0:05:12 +pred is: + ['The Scottish National Party'] + label is: + ['hold the majority of seats'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:30:32,121 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:32,121 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:32,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:32,122 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:32,122 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:33,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:33,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:33,132 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:33,135 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0133628845214844 s; generated tokens: 3 tokens; generate speed: 2.9604399823826357 tokens/s +2024-07-30 14:30:33,140 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:33,141 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1839/2067], cost time 1.0250s, every example cost time is 1.0250, generate speed: 2.9269 tokens/s, avg speed: 10.2127 tokens/s, remaining time: 0:05:11 +pred is: + ['Thursday'] + label is: + ['Thursday'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:33,224 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:33,224 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:33,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:33,225 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:33,225 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:34,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:34,785 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5598547458648682 s; generated tokens: 20 tokens; generate speed: 12.821706670457264 tokens/s +2024-07-30 14:30:34,790 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:34,791 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1840/2067], cost time 1.5716s, every example cost time is 1.5716, generate speed: 12.7262 tokens/s, avg speed: 10.2143 tokens/s, remaining time: 0:05:09 +pred is: + ['The First Minister or members of the cabinet can deliver statements to Parliament upon which MSPs are invited'] + label is: + ['Several procedures'] +The F1/Em of this example is: {'F1': 5.263157894736842, 'Em': 0.0} +F1 score: 62.38080096772845, Em score: 47.71739130434783, current_count: 1840 +2024-07-30 14:30:35,425 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:35,425 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 253, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:35,425 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:35,426 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:35,426 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:36,370 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,435 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,532 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,535 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1088802814483643 s; generated tokens: 6 tokens; generate speed: 5.41086364360551 tokens/s +2024-07-30 14:30:36,540 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:36,540 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1841/2067], cost time 1.1207s, every example cost time is 1.1207, generate speed: 5.3540 tokens/s, avg speed: 10.2121 tokens/s, remaining time: 0:05:08 +pred is: + ['Parliamentary time'] + label is: + ['Parliamentary time'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:36,623 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:36,624 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 302, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:36,624 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:36,625 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:36,625 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:37,571 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:37,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:37,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:37,641 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0160179138183594 s; generated tokens: 3 tokens; generate speed: 2.9527038442910083 tokens/s +2024-07-30 14:30:37,646 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:37,646 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1842/2067], cost time 1.0282s, every example cost time is 1.0282, generate speed: 2.9177 tokens/s, avg speed: 10.2091 tokens/s, remaining time: 0:05:07 +pred is: + ['73'] + label is: + ['73'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:37,729 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:37,729 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:37,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:37,730 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:37,730 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:38,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:38,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:39,303 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5721945762634277 s; generated tokens: 20 tokens; generate speed: 12.721071743888853 tokens/s +2024-07-30 14:30:39,307 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:39,308 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1843/2067], cost time 1.5842s, every example cost time is 1.5842, generate speed: 12.6248 tokens/s, avg speed: 10.2106 tokens/s, remaining time: 0:05:05 +pred is: + ['Proportionally to the number of votes received in the second vote of the ballot using the d'] + label is: + ['proportionally to the number of votes received'] +The F1/Em of this example is: {'F1': 56.52173913043478, 'Em': 0.0} +2024-07-30 14:30:39,394 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:39,394 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 219, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:39,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:39,395 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:39,395 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:40,339 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,508 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,540 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:40,971 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5756940841674805 s; generated tokens: 20 tokens; generate speed: 12.69281912076672 tokens/s +2024-07-30 14:30:40,976 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:40,976 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1844/2067], cost time 1.5875s, every example cost time is 1.5875, generate speed: 12.5981 tokens/s, avg speed: 10.2121 tokens/s, remaining time: 0:05:04 +pred is: + ['1'] + label is: + ['a number of qualifications'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:41,060 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:41,061 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 157, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:41,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:41,062 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:41,062 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:42,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,635 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5728650093078613 s; generated tokens: 20 tokens; generate speed: 12.71564939244277 tokens/s +2024-07-30 14:30:42,640 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:42,640 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1845/2067], cost time 1.5851s, every example cost time is 1.5851, generate speed: 12.6173 tokens/s, avg speed: 10.2136 tokens/s, remaining time: 0:05:03 +pred is: + ['1'] + label is: + ['a party has commanded a parliamentary majority'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:42,725 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:42,725 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:42,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:42,726 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:42,726 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:43,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,801 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:43,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:44,296 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5693330764770508 s; generated tokens: 20 tokens; generate speed: 12.744267166596275 tokens/s +2024-07-30 14:30:44,301 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:44,301 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1846/2067], cost time 1.5812s, every example cost time is 1.5812, generate speed: 12.6488 tokens/s, avg speed: 10.2152 tokens/s, remaining time: 0:05:01 +pred is: + ['The Conservatives'] + label is: + ['the Conservatives'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:44,386 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:44,387 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:44,387 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:44,387 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:44,387 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:45,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,401 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,635 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:45,959 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5716352462768555 s; generated tokens: 20 tokens; generate speed: 12.725599051929667 tokens/s +2024-07-30 14:30:45,964 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:45,965 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1847/2067], cost time 1.5838s, every example cost time is 1.5838, generate speed: 12.6282 tokens/s, avg speed: 10.2167 tokens/s, remaining time: 0:05:00 +pred is: + ['They are able to vote on domestic legislation that applies only to England, Wales and Northern Ireland'] + label is: + ['able to vote on domestic legislation that applies only to England, Wales and Northern Ireland'] +The F1/Em of this example is: {'F1': 93.75, 'Em': 0.0} +2024-07-30 14:30:46,052 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:46,052 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:46,052 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:46,053 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:46,053 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:46,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,611 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5582499504089355 s; generated tokens: 20 tokens; generate speed: 12.834911366274293 tokens/s +2024-07-30 14:30:47,616 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:47,617 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1848/2067], cost time 1.5705s, every example cost time is 1.5705, generate speed: 12.7350 tokens/s, avg speed: 10.2183 tokens/s, remaining time: 0:04:59 +pred is: + ['Islamism'] + label is: + ['Islamism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:47,701 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:47,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 201, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:47,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:47,702 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:47,702 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:48,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:48,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:48,713 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:48,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:48,749 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0466344356536865 s; generated tokens: 4 tokens; generate speed: 3.821773738508573 tokens/s +2024-07-30 14:30:48,754 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:48,754 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1849/2067], cost time 1.0583s, every example cost time is 1.0583, generate speed: 3.7795 tokens/s, avg speed: 10.2156 tokens/s, remaining time: 0:04:57 +pred is: + ['Democratic process'] + label is: + ['democratic'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:30:48,838 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:48,839 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:48,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:48,840 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:48,840 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:49,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:49,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:49,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:49,894 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:49,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:49,929 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0892415046691895 s; generated tokens: 5 tokens; generate speed: 4.590350237818505 tokens/s +2024-07-30 14:30:49,934 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:49,935 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1850/2067], cost time 1.1015s, every example cost time is 1.1015, generate speed: 4.5394 tokens/s, avg speed: 10.2131 tokens/s, remaining time: 0:04:56 +pred is: + ['A major division'] + label is: + ['major division'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 62.408619199865285, Em score: 47.67567567567568, current_count: 1850 +2024-07-30 14:30:50,577 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:50,577 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:50,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:50,578 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:50,578 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:51,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,618 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:51,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:52,111 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5328471660614014 s; generated tokens: 19 tokens; generate speed: 12.3952344504246 tokens/s +2024-07-30 14:30:52,117 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:52,117 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1851/2067], cost time 1.5452s, every example cost time is 1.5452, generate speed: 12.2961 tokens/s, avg speed: 10.2144 tokens/s, remaining time: 0:04:55 +pred is: + ['1'] + label is: + ['political'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:52,201 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:52,201 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:52,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:52,202 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:52,202 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:53,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,180 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,777 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5747711658477783 s; generated tokens: 20 tokens; generate speed: 12.700257938259236 tokens/s +2024-07-30 14:30:53,782 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:53,782 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1852/2067], cost time 1.5869s, every example cost time is 1.5869, generate speed: 12.6033 tokens/s, avg speed: 10.2159 tokens/s, remaining time: 0:04:53 +pred is: + ['1'] + label is: + ['Muslims'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:30:53,866 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:53,866 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:53,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:53,867 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:53,867 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:54,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:54,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:54,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:54,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:54,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:54,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,074 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,441 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5729169845581055 s; generated tokens: 20 tokens; generate speed: 12.715229218291384 tokens/s +2024-07-30 14:30:55,446 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:55,446 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1853/2067], cost time 1.5855s, every example cost time is 1.5855, generate speed: 12.6147 tokens/s, avg speed: 10.2174 tokens/s, remaining time: 0:04:52 +pred is: + ['Enemies'] + label is: + ['dangerous enemies'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:30:55,530 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:55,531 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 225, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:55,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:55,532 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:55,532 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:56,477 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:56,770 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:57,095 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5624260902404785 s; generated tokens: 20 tokens; generate speed: 12.800605497391386 tokens/s +2024-07-30 14:30:57,099 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:57,100 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1854/2067], cost time 1.5748s, every example cost time is 1.5748, generate speed: 12.7000 tokens/s, avg speed: 10.2189 tokens/s, remaining time: 0:04:50 +pred is: + ['Anwar Sadat'] + label is: + ['Anwar Sadat'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:30:57,184 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:57,184 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:57,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:57,185 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:57,185 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:58,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,743 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5579559803009033 s; generated tokens: 20 tokens; generate speed: 12.837333180708484 tokens/s +2024-07-30 14:30:58,748 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:30:58,748 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1855/2067], cost time 1.5699s, every example cost time is 1.5699, generate speed: 12.7394 tokens/s, avg speed: 10.2205 tokens/s, remaining time: 0:04:49 +pred is: + ['Strict, conservative'] + label is: + ['conservative'] +The F1/Em of this example is: {'F1': 40.0, 'Em': 0.0} +2024-07-30 14:30:58,832 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:30:58,832 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 139, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:30:58,832 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:58,833 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:30:58,833 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:30:59,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:30:59,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:00,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:00,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:00,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:00,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5545599460601807 s; generated tokens: 20 tokens; generate speed: 12.865377144630068 tokens/s +2024-07-30 14:31:00,393 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:00,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1856/2067], cost time 1.5663s, every example cost time is 1.5663, generate speed: 12.7686 tokens/s, avg speed: 10.2220 tokens/s, remaining time: 0:04:48 +pred is: + ['1'] + label is: + ['Islamist'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:31:00,477 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:00,477 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:00,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:00,478 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:00,478 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:01,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,556 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0779995918273926 s; generated tokens: 5 tokens; generate speed: 4.638220680143441 tokens/s +2024-07-30 14:31:01,561 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:01,562 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1857/2067], cost time 1.0899s, every example cost time is 1.0899, generate speed: 4.5877 tokens/s, avg speed: 10.2196 tokens/s, remaining time: 0:04:46 +pred is: + ['Law and philosophy'] + label is: + ['law and philosophy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:01,645 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:01,646 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:01,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:01,647 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:01,647 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:02,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,689 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:02,875 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:03,185 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5378131866455078 s; generated tokens: 20 tokens; generate speed: 13.0054808826466 tokens/s +2024-07-30 14:31:03,190 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:03,190 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1858/2067], cost time 1.5496s, every example cost time is 1.5496, generate speed: 12.9066 tokens/s, avg speed: 10.2213 tokens/s, remaining time: 0:04:45 +pred is: + ['Secularism and secular nationalism'] + label is: + ['secularism and secular nationalism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:03,274 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:03,274 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:03,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:03,275 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:03,275 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:04,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,346 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,728 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4526481628417969 s; generated tokens: 17 tokens; generate speed: 11.702764946704727 tokens/s +2024-07-30 14:31:04,733 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:04,733 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1859/2067], cost time 1.4641s, every example cost time is 1.4641, generate speed: 11.6115 tokens/s, avg speed: 10.2221 tokens/s, remaining time: 0:04:44 +pred is: + ['Sayyid Abul Ala Maududi'] + label is: + ['Sayyid Abul Ala Maududi'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:04,816 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:04,816 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:04,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:04,817 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:04,817 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:05,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:05,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:06,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:06,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:06,381 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5637285709381104 s; generated tokens: 20 tokens; generate speed: 12.789943454190148 tokens/s +2024-07-30 14:31:06,386 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:06,386 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1860/2067], cost time 1.5751s, every example cost time is 1.5751, generate speed: 12.6976 tokens/s, avg speed: 10.2236 tokens/s, remaining time: 0:04:42 +pred is: + ['Sharia'] + label is: + ['Sharia'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.390293290188595, Em score: 47.68817204301075, current_count: 1860 +2024-07-30 14:31:07,027 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:07,028 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:07,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:07,028 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:07,029 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:07,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:08,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:08,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:08,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:08,074 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0454738140106201 s; generated tokens: 4 tokens; generate speed: 3.82601644000561 tokens/s +2024-07-30 14:31:08,079 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:08,079 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1861/2067], cost time 1.0574s, every example cost time is 1.0574, generate speed: 3.7830 tokens/s, avg speed: 10.2209 tokens/s, remaining time: 0:04:41 +pred is: + ['1928'] + label is: + ['1928'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:08,163 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:08,163 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:08,164 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:08,164 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:08,164 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:09,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,141 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,239 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,304 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,722 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.557276964187622 s; generated tokens: 20 tokens; generate speed: 12.842930615385628 tokens/s +2024-07-30 14:31:09,727 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:09,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1862/2067], cost time 1.5693s, every example cost time is 1.5693, generate speed: 12.7443 tokens/s, avg speed: 10.2225 tokens/s, remaining time: 0:04:40 +pred is: + ['1'] + label is: + ['violence'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:31:09,811 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:09,811 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:09,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:09,812 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:09,812 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:10,756 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:10,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:11,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:11,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:11,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:11,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5794024467468262 s; generated tokens: 20 tokens; generate speed: 12.663016979108141 tokens/s +2024-07-30 14:31:11,396 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:11,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1863/2067], cost time 1.5912s, every example cost time is 1.5912, generate speed: 12.5689 tokens/s, avg speed: 10.2239 tokens/s, remaining time: 0:04:38 +pred is: + ['Influential'] + label is: + ['one of the most influential movements'] +The F1/Em of this example is: {'F1': 16.666666666666668, 'Em': 0.0} +2024-07-30 14:31:11,481 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:11,482 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:11,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:11,482 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:11,482 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:12,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,460 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:12,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:13,066 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.583832025527954 s; generated tokens: 20 tokens; generate speed: 12.627601713845385 tokens/s +2024-07-30 14:31:13,071 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:13,072 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1864/2067], cost time 1.5958s, every example cost time is 1.5958, generate speed: 12.5330 tokens/s, avg speed: 10.2254 tokens/s, remaining time: 0:04:37 +pred is: + ['A pivotal event'] + label is: + ['quick and decisive'] +The F1/Em of this example is: {'F1': 20.000000000000004, 'Em': 0.0} +2024-07-30 14:31:13,154 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:13,155 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:13,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:13,156 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:13,156 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:14,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,332 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,721 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5645694732666016 s; generated tokens: 20 tokens; generate speed: 12.783069299085074 tokens/s +2024-07-30 14:31:14,726 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:14,726 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1865/2067], cost time 1.5767s, every example cost time is 1.5767, generate speed: 12.6845 tokens/s, avg speed: 10.2269 tokens/s, remaining time: 0:04:36 +pred is: + ['Ideological'] + label is: + ['ideological'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:14,810 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:14,810 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:14,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:14,811 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:14,811 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:15,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:15,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:16,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:16,047 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:16,374 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5630805492401123 s; generated tokens: 20 tokens; generate speed: 12.795245907015445 tokens/s +2024-07-30 14:31:16,379 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:16,380 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1866/2067], cost time 1.5750s, every example cost time is 1.5750, generate speed: 12.6984 tokens/s, avg speed: 10.2284 tokens/s, remaining time: 0:04:34 +pred is: + ['Islamic Republic'] + label is: + ['Islamic'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:31:16,464 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:16,464 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:16,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:16,465 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:16,465 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:17,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,541 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,574 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:17,704 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:18,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5632705688476562 s; generated tokens: 20 tokens; generate speed: 12.793690611563633 tokens/s +2024-07-30 14:31:18,033 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:18,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1867/2067], cost time 1.5753s, every example cost time is 1.5753, generate speed: 12.6962 tokens/s, avg speed: 10.2300 tokens/s, remaining time: 0:04:33 +pred is: + ['Soviet Union'] + label is: + ['the Soviet Union'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:31:18,150 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:18,150 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:18,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:18,151 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:18,151 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:19,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,194 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,349 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,740 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5885882377624512 s; generated tokens: 20 tokens; generate speed: 12.589794840839486 tokens/s +2024-07-30 14:31:19,745 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:19,745 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1868/2067], cost time 1.6008s, every example cost time is 1.6008, generate speed: 12.4936 tokens/s, avg speed: 10.2314 tokens/s, remaining time: 0:04:32 +pred is: + ['It brought several hundred thousand US and allied non-Muslim military personnel to Saudi Arabian soil to put an'] + label is: + ['worked to radicalize the Islamist movement'] +The F1/Em of this example is: {'F1': 13.043478260869563, 'Em': 0.0} +2024-07-30 14:31:19,829 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:19,829 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:19,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:19,830 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:19,830 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:20,775 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:20,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:21,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:21,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:21,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:21,286 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4560213088989258 s; generated tokens: 17 tokens; generate speed: 11.675653299920288 tokens/s +2024-07-30 14:31:21,291 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:21,292 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1869/2067], cost time 1.4678s, every example cost time is 1.4678, generate speed: 11.5820 tokens/s, avg speed: 10.2322 tokens/s, remaining time: 0:04:30 +pred is: + ['Conservative Muslims'] + label is: + ['conservative Muslims'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:21,375 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:21,375 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 171, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:21,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:21,376 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:21,376 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:22,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:22,920 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5438275337219238 s; generated tokens: 20 tokens; generate speed: 12.95481494087825 tokens/s +2024-07-30 14:31:22,925 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:22,925 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1870/2067], cost time 1.5556s, every example cost time is 1.5556, generate speed: 12.8565 tokens/s, avg speed: 10.2337 tokens/s, remaining time: 0:04:29 +pred is: + ["Qutb's"] + label is: + ["Qutb's"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.363986986459004, Em score: 47.64705882352941, current_count: 1870 +2024-07-30 14:31:23,603 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:23,604 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:23,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:23,604 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:23,604 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:24,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,674 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,736 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,739 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1347224712371826 s; generated tokens: 7 tokens; generate speed: 6.168909294946748 tokens/s +2024-07-30 14:31:24,744 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:24,745 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1871/2067], cost time 1.1467s, every example cost time is 1.1467, generate speed: 6.1044 tokens/s, avg speed: 10.2319 tokens/s, remaining time: 0:04:27 +pred is: + ['Egyptian Islamic Jihad organization'] + label is: + ['Egyptian Islamic Jihad organization'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:24,827 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:24,828 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 238, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:24,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:24,828 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:24,829 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:25,773 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:25,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:26,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:26,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:26,375 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5459182262420654 s; generated tokens: 20 tokens; generate speed: 12.937294910234359 tokens/s +2024-07-30 14:31:26,380 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:26,380 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1872/2067], cost time 1.5576s, every example cost time is 1.5576, generate speed: 12.8401 tokens/s, avg speed: 10.2335 tokens/s, remaining time: 0:04:26 +pred is: + ['violence'] + label is: + ['violence'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:26,462 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:26,463 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 263, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:26,463 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:26,463 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:26,464 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:27,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,466 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,571 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1066746711730957 s; generated tokens: 5 tokens; generate speed: 4.51803961023153 tokens/s +2024-07-30 14:31:27,575 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:27,576 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1873/2067], cost time 1.1184s, every example cost time is 1.1184, generate speed: 4.4708 tokens/s, avg speed: 10.2310 tokens/s, remaining time: 0:04:25 +pred is: + ['quiescent'] + label is: + ['quiescent'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:27,659 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:27,659 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:27,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:27,660 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:27,660 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:28,604 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,670 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,799 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,830 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,863 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,895 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:28,929 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2688169479370117 s; generated tokens: 11 tokens; generate speed: 8.669493277091753 tokens/s +2024-07-30 14:31:28,934 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:28,934 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1874/2067], cost time 1.2808s, every example cost time is 1.2808, generate speed: 8.5882 tokens/s, avg speed: 10.2301 tokens/s, remaining time: 0:04:23 +pred is: + ['Hamas'] + label is: + ['Hamas'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:29,018 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:29,018 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:29,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:29,019 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:29,019 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:29,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:29,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,599 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.579240083694458 s; generated tokens: 20 tokens; generate speed: 12.664318874944085 tokens/s +2024-07-30 14:31:30,604 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:30,604 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1875/2067], cost time 1.5910s, every example cost time is 1.5910, generate speed: 12.5705 tokens/s, avg speed: 10.2316 tokens/s, remaining time: 0:04:22 +pred is: + ['Islamist'] + label is: + ['Islamist'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:30,686 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:30,687 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:30,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:30,688 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:30,688 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:31,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,697 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:31,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:32,228 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5399186611175537 s; generated tokens: 20 tokens; generate speed: 12.987698964233312 tokens/s +2024-07-30 14:31:32,233 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:32,233 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1876/2067], cost time 1.5517s, every example cost time is 1.5517, generate speed: 12.8895 tokens/s, avg speed: 10.2332 tokens/s, remaining time: 0:04:21 +pred is: + ['1985'] + label is: + ['1985'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:32,316 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:32,316 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 233, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:32,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:32,317 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:32,317 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:33,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,739 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4219088554382324 s; generated tokens: 16 tokens; generate speed: 11.252479326509855 tokens/s +2024-07-30 14:31:33,744 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:33,744 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1877/2067], cost time 1.4336s, every example cost time is 1.4336, generate speed: 11.1610 tokens/s, avg speed: 10.2337 tokens/s, remaining time: 0:04:19 +pred is: + ['stay home to alleviate the high rate of unemployment among young Algerian men'] + label is: + ['staying home'] +The F1/Em of this example is: {'F1': 14.285714285714285, 'Em': 0.0} +2024-07-30 14:31:33,828 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:33,828 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 185, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:33,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:33,829 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:33,829 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:34,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,900 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,903 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0736327171325684 s; generated tokens: 5 tokens; generate speed: 4.657086096774208 tokens/s +2024-07-30 14:31:34,907 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:34,908 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1878/2067], cost time 1.0852s, every example cost time is 1.0852, generate speed: 4.6075 tokens/s, avg speed: 10.2313 tokens/s, remaining time: 0:04:18 +pred is: + ['justice and prosperity'] + label is: + ['justice and prosperity'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:34,992 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:34,992 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:34,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:34,992 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:34,993 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:35,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:35,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,158 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1654319763183594 s; generated tokens: 8 tokens; generate speed: 6.864407500875582 tokens/s +2024-07-30 14:31:36,163 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:36,163 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1879/2067], cost time 1.1767s, every example cost time is 1.1767, generate speed: 6.7988 tokens/s, avg speed: 10.2298 tokens/s, remaining time: 0:04:17 +pred is: + ['Taliban'] + label is: + ['The Taliban'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:31:36,246 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:36,246 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 311, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:36,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:36,247 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:36,247 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:37,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,444 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,475 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:37,508 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2611114978790283 s; generated tokens: 11 tokens; generate speed: 8.722464285275409 tokens/s +2024-07-30 14:31:37,513 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:37,513 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1880/2067], cost time 1.2722s, every example cost time is 1.2722, generate speed: 8.6461 tokens/s, avg speed: 10.2290 tokens/s, remaining time: 0:04:15 +pred is: + ['1977'] + label is: + ['July 1977'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +F1 score: 62.465394350512796, Em score: 47.765957446808514, current_count: 1880 +2024-07-30 14:31:38,156 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:38,156 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:38,157 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:38,157 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:38,157 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:39,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,197 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,350 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,726 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5688889026641846 s; generated tokens: 20 tokens; generate speed: 12.747875242177638 tokens/s +2024-07-30 14:31:39,731 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:39,732 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1881/2067], cost time 1.5806s, every example cost time is 1.5806, generate speed: 12.6531 tokens/s, avg speed: 10.2305 tokens/s, remaining time: 0:04:14 +pred is: + ['Extremist militant group'] + label is: + ['Wahhabi/Salafi jihadist extremist militant'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:31:39,814 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:39,814 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 269, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:39,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:39,815 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:39,815 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:40,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,917 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:40,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:41,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:41,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:41,322 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5063893795013428 s; generated tokens: 19 tokens; generate speed: 12.61294075658548 tokens/s +2024-07-30 14:31:41,327 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:41,327 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1882/2067], cost time 1.5180s, every example cost time is 1.5180, generate speed: 12.5168 tokens/s, avg speed: 10.2318 tokens/s, remaining time: 0:04:12 +pred is: + ['2004'] + label is: + ['2004'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:41,410 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:41,410 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:41,411 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:41,411 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:41,411 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:42,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:42,978 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5663678646087646 s; generated tokens: 20 tokens; generate speed: 12.768392694902131 tokens/s +2024-07-30 14:31:42,983 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:42,983 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1883/2067], cost time 1.5777s, every example cost time is 1.5777, generate speed: 12.6768 tokens/s, avg speed: 10.2333 tokens/s, remaining time: 0:04:11 +pred is: + ["HT sees Islam's pivotal turning point as occurring not with the death of Ali, or one of"] + label is: + ['a different view'] +The F1/Em of this example is: {'F1': 4.878048780487805, 'Em': 0.0} +2024-07-30 14:31:43,067 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:43,067 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:43,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:43,068 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:43,068 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:44,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,203 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,613 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5447678565979004 s; generated tokens: 20 tokens; generate speed: 12.94692915480954 tokens/s +2024-07-30 14:31:44,618 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:44,618 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1884/2067], cost time 1.5565s, every example cost time is 1.5565, generate speed: 12.8496 tokens/s, avg speed: 10.2349 tokens/s, remaining time: 0:04:10 +pred is: + ['Armed jihad'] + label is: + ['armed'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:31:44,701 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:44,701 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:44,701 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:44,702 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:44,702 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:45,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,772 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:45,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:46,242 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402781963348389 s; generated tokens: 20 tokens; generate speed: 12.98466734619168 tokens/s +2024-07-30 14:31:46,247 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:46,248 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1885/2067], cost time 1.5518s, every example cost time is 1.5518, generate speed: 12.8879 tokens/s, avg speed: 10.2365 tokens/s, remaining time: 0:04:08 +pred is: + ['900000'] + label is: + ['over 900,000'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:31:46,331 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:46,331 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:46,331 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:46,332 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:46,332 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:47,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,440 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1080448627471924 s; generated tokens: 6 tokens; generate speed: 5.414943204667823 tokens/s +2024-07-30 14:31:47,445 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:47,445 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1886/2067], cost time 1.1195s, every example cost time is 1.1195, generate speed: 5.3595 tokens/s, avg speed: 10.2344 tokens/s, remaining time: 0:04:07 +pred is: + ['Since 2001'] + label is: + ['since 2001'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:47,528 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:47,528 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:47,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:47,529 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:47,529 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:48,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,665 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:48,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:49,075 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.545839548110962 s; generated tokens: 20 tokens; generate speed: 12.937953375846986 tokens/s +2024-07-30 14:31:49,080 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:49,080 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1887/2067], cost time 1.5574s, every example cost time is 1.5574, generate speed: 12.8421 tokens/s, avg speed: 10.2360 tokens/s, remaining time: 0:04:06 +pred is: + ['Latin'] + label is: + ['Latin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:49,164 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:49,164 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:49,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:49,165 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:49,165 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:50,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,247 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,593 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4276447296142578 s; generated tokens: 16 tokens; generate speed: 11.207270035818446 tokens/s +2024-07-30 14:31:50,598 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:50,598 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1888/2067], cost time 1.4393s, every example cost time is 1.4393, generate speed: 11.1167 tokens/s, avg speed: 10.2365 tokens/s, remaining time: 0:04:04 +pred is: + ['influence through diplomacy or military force'] + label is: + ['influence'] +The F1/Em of this example is: {'F1': 16.666666666666668, 'Em': 0.0} +2024-07-30 14:31:50,682 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:50,682 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:50,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:50,683 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:50,683 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:51,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,860 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:51,925 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:52,245 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5616259574890137 s; generated tokens: 20 tokens; generate speed: 12.807164163791574 tokens/s +2024-07-30 14:31:52,250 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:52,250 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1889/2067], cost time 1.5734s, every example cost time is 1.5734, generate speed: 12.7115 tokens/s, avg speed: 10.2380 tokens/s, remaining time: 0:04:03 +pred is: + ['1'] + label is: + ['"informal" imperialism'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:31:52,334 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:52,334 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 394, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:52,335 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:52,335 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:52,335 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:53,282 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,442 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,473 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:53,885 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5498723983764648 s; generated tokens: 20 tokens; generate speed: 12.90428813426871 tokens/s +2024-07-30 14:31:53,890 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:53,890 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1890/2067], cost time 1.5614s, every example cost time is 1.5614, generate speed: 12.8087 tokens/s, avg speed: 10.2395 tokens/s, remaining time: 0:04:02 +pred is: + ['1'] + label is: + ['distinction'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.357929150482114, Em score: 47.67195767195767, current_count: 1890 +2024-07-30 14:31:54,538 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:54,539 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 279, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:54,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:54,539 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:54,539 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:55,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,583 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,679 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:55,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:56,100 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5600147247314453 s; generated tokens: 20 tokens; generate speed: 12.820391809726653 tokens/s +2024-07-30 14:31:56,105 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:56,105 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1891/2067], cost time 1.5719s, every example cost time is 1.5719, generate speed: 12.7234 tokens/s, avg speed: 10.2410 tokens/s, remaining time: 0:04:00 +pred is: + ['Colonialism'] + label is: + ['colonialism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:31:56,188 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:56,189 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 313, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:56,189 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:56,189 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:56,189 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:57,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,169 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,751 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5610151290893555 s; generated tokens: 20 tokens; generate speed: 12.812175633215892 tokens/s +2024-07-30 14:31:57,756 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:57,756 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1892/2067], cost time 1.5730s, every example cost time is 1.5730, generate speed: 12.7144 tokens/s, avg speed: 10.2425 tokens/s, remaining time: 0:03:59 +pred is: + ['1'] + label is: + ['Imperialism and colonialism'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:31:57,840 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:57,841 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 247, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:57,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:57,841 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:57,842 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:31:58,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:58,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:59,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:59,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:59,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:59,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5459768772125244 s; generated tokens: 20 tokens; generate speed: 12.936804097653146 tokens/s +2024-07-30 14:31:59,393 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:31:59,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1893/2067], cost time 1.5578s, every example cost time is 1.5578, generate speed: 12.8387 tokens/s, avg speed: 10.2441 tokens/s, remaining time: 0:03:58 +pred is: + ['the defense and justification of empire-building based on seemingly rational grounds'] + label is: + ['empire-building'] +The F1/Em of this example is: {'F1': 9.09090909090909, 'Em': 0.0} +2024-07-30 14:31:59,477 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:31:59,477 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 145, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:31:59,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:31:59,478 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:31:59,478 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:00,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,620 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:00,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4584956169128418 s; generated tokens: 17 tokens; generate speed: 11.655845792655477 tokens/s +2024-07-30 14:32:00,942 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:00,942 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1894/2067], cost time 1.4703s, every example cost time is 1.4703, generate speed: 11.5625 tokens/s, avg speed: 10.2448 tokens/s, remaining time: 0:03:56 +pred is: + ['Germany'] + label is: + ['Germany'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:01,026 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:01,026 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:01,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:01,027 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:01,027 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:01,971 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,163 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,195 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,226 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,257 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,572 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5444586277008057 s; generated tokens: 20 tokens; generate speed: 12.949521367091242 tokens/s +2024-07-30 14:32:02,577 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:02,577 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1895/2067], cost time 1.5564s, every example cost time is 1.5564, generate speed: 12.8498 tokens/s, avg speed: 10.2464 tokens/s, remaining time: 0:03:55 +pred is: + ['1'] + label is: + ['environmental determinism'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:02,671 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:02,672 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 148, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:02,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:02,673 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:02,673 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:03,616 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:03,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:03,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:03,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:03,718 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0447578430175781 s; generated tokens: 4 tokens; generate speed: 3.8286384033708565 tokens/s +2024-07-30 14:32:03,723 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:03,723 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1896/2067], cost time 1.0566s, every example cost time is 1.0566, generate speed: 3.7859 tokens/s, avg speed: 10.2438 tokens/s, remaining time: 0:03:53 +pred is: + ['Roman law'] + label is: + ['Terra nullius'] +The F1/Em of this example is: {'F1': 33.33333333333333, 'Em': 0.0} +2024-07-30 14:32:03,807 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:03,807 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 276, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:03,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:03,808 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:03,808 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:04,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:04,983 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:05,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:05,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:05,368 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5600152015686035 s; generated tokens: 20 tokens; generate speed: 12.820387891021763 tokens/s +2024-07-30 14:32:05,373 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:05,373 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1897/2067], cost time 1.5718s, every example cost time is 1.5718, generate speed: 12.7241 tokens/s, avg speed: 10.2453 tokens/s, remaining time: 0:03:52 +pred is: + ['1'] + label is: + ['an imaginative geography'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:05,456 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:05,456 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:05,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:05,457 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:05,457 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:06,400 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,465 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,497 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,621 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:06,995 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.537973165512085 s; generated tokens: 20 tokens; generate speed: 13.004128061844812 tokens/s +2024-07-30 14:32:07,000 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:07,001 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1898/2067], cost time 1.5498s, every example cost time is 1.5498, generate speed: 12.9046 tokens/s, avg speed: 10.2469 tokens/s, remaining time: 0:03:51 +pred is: + ['the role of nineteenth-century maps during the "scramble for Africa"'] + label is: + ['nineteenth-century maps'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:32:07,084 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:07,084 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:07,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:07,085 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:07,085 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:08,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:08,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:08,094 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:08,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:08,128 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0425217151641846 s; generated tokens: 4 tokens; generate speed: 3.836850534446708 tokens/s +2024-07-30 14:32:08,133 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:08,133 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1899/2067], cost time 1.0540s, every example cost time is 1.0540, generate speed: 3.7951 tokens/s, avg speed: 10.2442 tokens/s, remaining time: 0:03:49 +pred is: + ['1'] + label is: + ['the pre-Columbian era'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:08,214 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:08,215 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 255, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:08,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:08,215 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:08,216 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:09,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,193 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,224 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,255 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,348 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,379 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:09,759 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5436913967132568 s; generated tokens: 20 tokens; generate speed: 12.95595741647774 tokens/s +2024-07-30 14:32:09,764 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:09,765 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1900/2067], cost time 1.5550s, every example cost time is 1.5550, generate speed: 12.8620 tokens/s, avg speed: 10.2458 tokens/s, remaining time: 0:03:48 +pred is: + ['Cultural imperialism'] + label is: + ['Cultural imperialism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.22311070359759, Em score: 47.578947368421055, current_count: 1900 +2024-07-30 14:32:10,418 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:10,418 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:10,419 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:10,419 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:10,419 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:11,363 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:11,950 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5311007499694824 s; generated tokens: 20 tokens; generate speed: 13.062497683708035 tokens/s +2024-07-30 14:32:11,955 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:11,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1901/2067], cost time 1.5428s, every example cost time is 1.5428, generate speed: 12.9638 tokens/s, avg speed: 10.2474 tokens/s, remaining time: 0:03:47 +pred is: + ['1700'] + label is: + ['around 1700'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:32:12,038 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:12,039 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:12,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:12,040 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:12,040 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:12,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,576 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5362730026245117 s; generated tokens: 20 tokens; generate speed: 13.018519472667126 tokens/s +2024-07-30 14:32:13,581 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:13,581 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1902/2067], cost time 1.5481s, every example cost time is 1.5481, generate speed: 12.9187 tokens/s, avg speed: 10.2490 tokens/s, remaining time: 0:03:45 +pred is: + ['1919'] + label is: + ['1919'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:13,663 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:13,663 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:13,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:13,664 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:13,664 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:14,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,641 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,672 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,765 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:14,888 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:15,196 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318081378936768 s; generated tokens: 20 tokens; generate speed: 13.056465431435255 tokens/s +2024-07-30 14:32:15,201 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:15,201 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1903/2067], cost time 1.5429s, every example cost time is 1.5429, generate speed: 12.9626 tokens/s, avg speed: 10.2506 tokens/s, remaining time: 0:03:44 +pred is: + ['economic growth'] + label is: + ['economic growth'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:15,284 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:15,284 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:15,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:15,285 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:15,285 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:16,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:16,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:16,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:16,294 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0095057487487793 s; generated tokens: 3 tokens; generate speed: 2.971751278997982 tokens/s +2024-07-30 14:32:16,299 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:16,300 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1904/2067], cost time 1.0207s, every example cost time is 1.0207, generate speed: 2.9392 tokens/s, avg speed: 10.2477 tokens/s, remaining time: 0:03:43 +pred is: + ['Communication'] + label is: + ['communication'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:16,382 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:16,382 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 425, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:16,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:16,383 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:16,383 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:17,330 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,519 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,645 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.261709451675415 s; generated tokens: 11 tokens; generate speed: 8.718330504216464 tokens/s +2024-07-30 14:32:17,650 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:17,650 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1905/2067], cost time 1.2728s, every example cost time is 1.2728, generate speed: 8.6421 tokens/s, avg speed: 10.2470 tokens/s, remaining time: 0:03:41 +pred is: + ['British'] + label is: + ['British'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:17,732 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:17,732 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 246, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:17,732 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:17,732 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:17,733 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:18,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,741 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,904 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:18,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:19,091 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3579895496368408 s; generated tokens: 14 tokens; generate speed: 10.309357685222201 tokens/s +2024-07-30 14:32:19,096 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:19,096 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1906/2067], cost time 1.3692s, every example cost time is 1.3692, generate speed: 10.2251 tokens/s, avg speed: 10.2470 tokens/s, remaining time: 0:03:40 +pred is: + ['aristocracy'] + label is: + ['aristocracy'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:19,178 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:19,179 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:19,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:19,179 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:19,180 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:20,122 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,713 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5335495471954346 s; generated tokens: 20 tokens; generate speed: 13.041639271829286 tokens/s +2024-07-30 14:32:20,718 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:20,718 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1907/2067], cost time 1.5448s, every example cost time is 1.5448, generate speed: 12.9469 tokens/s, avg speed: 10.2486 tokens/s, remaining time: 0:03:38 +pred is: + ['Environmental determinism'] + label is: + ['environmental determinism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:20,801 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:20,802 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:20,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:20,802 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:20,802 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:21,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,902 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:21,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:22,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:22,332 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529567003250122 s; generated tokens: 20 tokens; generate speed: 13.075595876154962 tokens/s +2024-07-30 14:32:22,338 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:22,338 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1908/2067], cost time 1.5415s, every example cost time is 1.5415, generate speed: 12.9743 tokens/s, avg speed: 10.2502 tokens/s, remaining time: 0:03:37 +pred is: + ['Geographic scholars under colonizing empires'] + label is: + ['geographic scholars'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:32:22,421 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:22,421 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 152, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:22,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:22,421 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:22,422 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:23,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,489 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:23,950 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5279674530029297 s; generated tokens: 20 tokens; generate speed: 13.089284042466874 tokens/s +2024-07-30 14:32:23,955 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:23,955 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1909/2067], cost time 1.5391s, every example cost time is 1.5391, generate speed: 12.9943 tokens/s, avg speed: 10.2518 tokens/s, remaining time: 0:03:36 +pred is: + ['1599'] + label is: + ['the sixteenth century'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:24,037 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:24,037 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 176, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:24,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:24,038 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:24,038 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:24,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,259 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,292 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2537543773651123 s; generated tokens: 11 tokens; generate speed: 8.773648330638396 tokens/s +2024-07-30 14:32:25,297 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:25,297 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1910/2067], cost time 1.2648s, every example cost time is 1.2648, generate speed: 8.6970 tokens/s, avg speed: 10.2510 tokens/s, remaining time: 0:03:34 +pred is: + ['1830'] + label is: + ['1830'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.316183422426924, Em score: 47.696335078534034, current_count: 1910 +2024-07-30 14:32:25,955 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:25,955 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:25,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:25,956 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:25,956 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:26,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:26,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:26,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:26,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,496 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402228832244873 s; generated tokens: 20 tokens; generate speed: 12.985133656844262 tokens/s +2024-07-30 14:32:27,501 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:27,502 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1911/2067], cost time 1.5519s, every example cost time is 1.5519, generate speed: 12.8872 tokens/s, avg speed: 10.2526 tokens/s, remaining time: 0:03:33 +pred is: + ['civilize the inferior'] + label is: + ['civilize the inferior'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:27,584 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:27,584 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 203, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:27,585 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:27,585 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:27,585 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:28,529 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:28,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:29,116 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307714939117432 s; generated tokens: 20 tokens; generate speed: 13.065307316960727 tokens/s +2024-07-30 14:32:29,121 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:29,121 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1912/2067], cost time 1.5420s, every example cost time is 1.5420, generate speed: 12.9706 tokens/s, avg speed: 10.2542 tokens/s, remaining time: 0:03:32 +pred is: + ['1'] + label is: + ['overseas colonies'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:29,204 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:29,204 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 229, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:29,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:29,204 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:29,205 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:30,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,368 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,430 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,525 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.320204734802246 s; generated tokens: 13 tokens; generate speed: 9.84695756446236 tokens/s +2024-07-30 14:32:30,530 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:30,530 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1913/2067], cost time 1.3315s, every example cost time is 1.3315, generate speed: 9.7632 tokens/s, avg speed: 10.2539 tokens/s, remaining time: 0:03:30 +pred is: + ['Scandinavia and northern Europe'] + label is: + ['Scandinavia'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:32:30,612 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:30,613 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:30,613 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:30,613 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:30,613 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:31,557 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,776 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,807 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,838 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,903 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2891497611999512 s; generated tokens: 12 tokens; generate speed: 9.308460786456882 tokens/s +2024-07-30 14:32:31,908 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:31,908 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1914/2067], cost time 1.3005s, every example cost time is 1.3005, generate speed: 9.2276 tokens/s, avg speed: 10.2534 tokens/s, remaining time: 0:03:29 +pred is: + ['19th century'] + label is: + ['late 19th century'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:32:31,990 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:31,991 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:31,991 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:31,991 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:31,991 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:32,935 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:32,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:32,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,184 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,215 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,534 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5423521995544434 s; generated tokens: 20 tokens; generate speed: 12.96720684534805 tokens/s +2024-07-30 14:32:33,539 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:33,539 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1915/2067], cost time 1.5538s, every example cost time is 1.5538, generate speed: 12.8719 tokens/s, avg speed: 10.2550 tokens/s, remaining time: 0:03:28 +pred is: + ['1'] + label is: + ['the South Pacific'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:33,622 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:33,622 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 286, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:33,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:33,622 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:33,623 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:34,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,663 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,694 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:34,942 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3194770812988281 s; generated tokens: 13 tokens; generate speed: 9.85238787717589 tokens/s +2024-07-30 14:32:34,947 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:34,947 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1916/2067], cost time 1.3307s, every example cost time is 1.3307, generate speed: 9.7694 tokens/s, avg speed: 10.2547 tokens/s, remaining time: 0:03:26 +pred is: + ['Japan took part of Sakhalin Island from Russia.'] + label is: + ['Japan took part of Sakhalin Island'] +The F1/Em of this example is: {'F1': 81.48148148148148, 'Em': 0.0} +2024-07-30 14:32:35,030 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:35,030 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 226, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:35,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:35,031 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:35,031 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:35,974 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,099 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,160 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,562 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5313215255737305 s; generated tokens: 20 tokens; generate speed: 13.06061442093732 tokens/s +2024-07-30 14:32:36,567 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:36,567 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1917/2067], cost time 1.5425s, every example cost time is 1.5425, generate speed: 12.9657 tokens/s, avg speed: 10.2563 tokens/s, remaining time: 0:03:25 +pred is: + ['1'] + label is: + ['China'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:32:36,649 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:36,650 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 417, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:36,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:36,650 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:36,651 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:37,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,631 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,662 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:37,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:38,189 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5381691455841064 s; generated tokens: 20 tokens; generate speed: 13.002471189477133 tokens/s +2024-07-30 14:32:38,194 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:38,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1918/2067], cost time 1.5495s, every example cost time is 1.5495, generate speed: 12.9070 tokens/s, avg speed: 10.2579 tokens/s, remaining time: 0:03:23 +pred is: + ['Trotsky thought that the revolution could only succeed in Russia as part of a world revolution.'] + label is: + ['a world revolution'] +The F1/Em of this example is: {'F1': 27.027027027027028, 'Em': 0.0} +2024-07-30 14:32:38,277 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:38,277 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:38,278 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:38,278 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:38,278 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:39,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,316 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,409 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,440 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,823 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5443141460418701 s; generated tokens: 20 tokens; generate speed: 12.950732887645097 tokens/s +2024-07-30 14:32:39,828 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:39,828 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1919/2067], cost time 1.5556s, every example cost time is 1.5556, generate speed: 12.8567 tokens/s, avg speed: 10.2594 tokens/s, remaining time: 0:03:22 +pred is: + ['mercantilism'] + label is: + ['mercantilism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:39,910 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:39,911 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 198, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:39,912 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:39,913 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:39,913 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:40,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:40,891 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:40,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:40,925 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0122735500335693 s; generated tokens: 3 tokens; generate speed: 2.9636257905785577 tokens/s +2024-07-30 14:32:40,930 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:40,931 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1920/2067], cost time 1.0251s, every example cost time is 1.0251, generate speed: 2.9264 tokens/s, avg speed: 10.2566 tokens/s, remaining time: 0:03:21 +pred is: + ['Britain'] + label is: + ['The British Empire'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.2043848152833, Em score: 47.552083333333336, current_count: 1920 +2024-07-30 14:32:41,583 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:41,583 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 297, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:41,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:41,584 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:41,584 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:42,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,563 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,717 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,748 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,780 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:42,811 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:43,125 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5402882099151611 s; generated tokens: 20 tokens; generate speed: 12.984582931464233 tokens/s +2024-07-30 14:32:43,130 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:43,130 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1921/2067], cost time 1.5521s, every example cost time is 1.5521, generate speed: 12.8856 tokens/s, avg speed: 10.2581 tokens/s, remaining time: 0:03:19 +pred is: + ['The United States planned to subdue imperialistic tendencies by creating the Anti-Imperialist League'] + label is: + ['the Monroe Doctrine'] +The F1/Em of this example is: {'F1': 13.333333333333334, 'Em': 0.0} +2024-07-30 14:32:43,214 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:43,214 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:43,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:43,215 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:43,215 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:44,158 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,191 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,222 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,745 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.529578447341919 s; generated tokens: 20 tokens; generate speed: 13.075498046377245 tokens/s +2024-07-30 14:32:44,749 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:44,750 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1922/2067], cost time 1.5409s, every example cost time is 1.5409, generate speed: 12.9797 tokens/s, avg speed: 10.2597 tokens/s, remaining time: 0:03:18 +pred is: + ['Isiah Bowman'] + label is: + ['Isiah Bowman'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:44,832 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:44,833 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 327, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:44,833 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:44,833 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:44,833 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:45,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,844 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,937 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:45,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:46,030 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:46,033 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.19907808303833 s; generated tokens: 9 tokens; generate speed: 7.5057664111373 tokens/s +2024-07-30 14:32:46,038 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:46,038 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1923/2067], cost time 1.2103s, every example cost time is 1.2103, generate speed: 7.4361 tokens/s, avg speed: 10.2584 tokens/s, remaining time: 0:03:17 +pred is: + ['internal'] + label is: + ['internal strife'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:32:46,120 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:46,120 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:46,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:46,121 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:46,121 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:47,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:47,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:47,128 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:47,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:47,162 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0406877994537354 s; generated tokens: 4 tokens; generate speed: 3.8436118902322383 tokens/s +2024-07-30 14:32:47,167 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:47,167 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1924/2067], cost time 1.0518s, every example cost time is 1.0518, generate speed: 3.8030 tokens/s, avg speed: 10.2558 tokens/s, remaining time: 0:03:15 +pred is: + ['1923'] + label is: + ['1923'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:47,248 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:47,249 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:47,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:47,249 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:47,249 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:48,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,225 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,286 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,317 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,354 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,417 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,478 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,605 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3552298545837402 s; generated tokens: 14 tokens; generate speed: 10.33035093836544 tokens/s +2024-07-30 14:32:48,610 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:48,610 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1925/2067], cost time 1.3665s, every example cost time is 1.3665, generate speed: 10.2451 tokens/s, avg speed: 10.2558 tokens/s, remaining time: 0:03:14 +pred is: + ['Istanbul'] + label is: + ['Istanbul'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:48,692 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:48,692 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 153, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:48,693 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:48,693 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:48,693 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:49,636 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:49,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:50,230 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5370659828186035 s; generated tokens: 20 tokens; generate speed: 13.011803151953755 tokens/s +2024-07-30 14:32:50,235 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:50,235 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1926/2067], cost time 1.5483s, every example cost time is 1.5483, generate speed: 12.9174 tokens/s, avg speed: 10.2574 tokens/s, remaining time: 0:03:13 +pred is: + ['United Methodist Church'] + label is: + ['United Methodist Church'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:50,318 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:50,318 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:50,319 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:50,319 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:50,319 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:51,263 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,420 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,483 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,854 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5344674587249756 s; generated tokens: 20 tokens; generate speed: 13.033837821897157 tokens/s +2024-07-30 14:32:51,859 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:51,859 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1927/2067], cost time 1.5458s, every example cost time is 1.5458, generate speed: 12.9382 tokens/s, avg speed: 10.2590 tokens/s, remaining time: 0:03:11 +pred is: + ['80 million'] + label is: + ['United Methodist Church'] +The F1/Em of this example is: {'F1': 25.0, 'Em': 0.0} +2024-07-30 14:32:51,941 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:51,941 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:51,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:51,942 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:51,942 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:52,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:52,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:52,950 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:52,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,474 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5313568115234375 s; generated tokens: 20 tokens; generate speed: 13.060313474626092 tokens/s +2024-07-30 14:32:53,479 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:53,479 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1928/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9652 tokens/s, avg speed: 10.2606 tokens/s, remaining time: 0:03:10 +pred is: + ['mid-18th century'] + label is: + ['mid-18th century'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:53,561 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:53,561 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 210, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:53,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:53,562 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:53,562 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:54,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,538 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,600 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:54,969 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4073026180267334 s; generated tokens: 16 tokens; generate speed: 11.369267558412274 tokens/s +2024-07-30 14:32:54,974 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:54,974 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1929/2067], cost time 1.4184s, every example cost time is 1.4184, generate speed: 11.2804 tokens/s, avg speed: 10.2611 tokens/s, remaining time: 0:03:08 +pred is: + ['1735'] + label is: + ['1735'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:55,056 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:55,056 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 199, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:55,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:55,057 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:55,057 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:56,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,282 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2245941162109375 s; generated tokens: 10 tokens; generate speed: 8.165970967540963 tokens/s +2024-07-30 14:32:56,287 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:56,287 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1930/2067], cost time 1.2356s, every example cost time is 1.2356, generate speed: 8.0929 tokens/s, avg speed: 10.2601 tokens/s, remaining time: 0:03:07 +pred is: + ['The American Revolution'] + label is: + ['American Revolution'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +F1 score: 62.27759180242346, Em score: 47.61658031088083, current_count: 1930 +2024-07-30 14:32:56,944 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:56,944 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:56,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:56,945 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:56,945 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:57,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:57,922 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:57,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:57,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,168 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,476 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5302150249481201 s; generated tokens: 20 tokens; generate speed: 13.070058569499455 tokens/s +2024-07-30 14:32:58,481 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:58,482 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1931/2067], cost time 1.5426s, every example cost time is 1.5426, generate speed: 12.9649 tokens/s, avg speed: 10.2617 tokens/s, remaining time: 0:03:06 +pred is: + ["St. George's United Methodist Church"] + label is: + ["St. George's United Methodist Church"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:58,564 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:58,565 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:58,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:58,565 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:58,565 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:32:59,509 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,542 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,702 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,733 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,735 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1697511672973633 s; generated tokens: 8 tokens; generate speed: 6.839061352239125 tokens/s +2024-07-30 14:32:59,740 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:32:59,740 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1932/2067], cost time 1.1808s, every example cost time is 1.1808, generate speed: 6.7748 tokens/s, avg speed: 10.2601 tokens/s, remaining time: 0:03:04 +pred is: + ['Richard Allen and Absalom Jones'] + label is: + ['Richard Allen and Absalom Jones'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:32:59,823 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:32:59,823 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:32:59,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:32:59,824 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:32:59,824 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:00,767 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,862 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,893 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,924 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:00,985 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:01,016 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:01,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:01,049 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2243242263793945 s; generated tokens: 10 tokens; generate speed: 8.167771072840955 tokens/s +2024-07-30 14:33:01,053 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:01,054 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1933/2067], cost time 1.2355s, every example cost time is 1.2355, generate speed: 8.0939 tokens/s, avg speed: 10.2591 tokens/s, remaining time: 0:03:03 +pred is: + ['1830'] + label is: + ['1830'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:01,136 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:01,136 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:01,136 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:01,137 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:01,137 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:02,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:02,113 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:02,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:02,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:02,177 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0402729511260986 s; generated tokens: 4 tokens; generate speed: 3.8451446763755492 tokens/s +2024-07-30 14:33:02,182 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:02,182 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1934/2067], cost time 1.0515s, every example cost time is 1.0515, generate speed: 3.8040 tokens/s, avg speed: 10.2565 tokens/s, remaining time: 0:03:02 +pred is: + ['1968'] + label is: + ['April 23, 1968'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:33:02,264 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:02,264 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:02,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:02,264 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:02,265 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:03,208 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,797 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532064437866211 s; generated tokens: 20 tokens; generate speed: 13.054281207554874 tokens/s +2024-07-30 14:33:03,802 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:03,802 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1935/2067], cost time 1.5433s, every example cost time is 1.5433, generate speed: 12.9596 tokens/s, avg speed: 10.2581 tokens/s, remaining time: 0:03:00 +pred is: + ['the holy catholic (or universal) church'] + label is: + ['holy catholic (or universal) church'] +The F1/Em of this example is: {'F1': 91.66666666666666, 'Em': 0.0} +2024-07-30 14:33:03,885 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:03,886 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:03,886 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:03,886 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:03,886 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:04,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:04,864 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:04,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:04,926 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:04,957 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:04,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,018 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,049 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,080 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,418 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.531864881515503 s; generated tokens: 20 tokens; generate speed: 13.055981791431645 tokens/s +2024-07-30 14:33:05,423 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:05,424 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1936/2067], cost time 1.5430s, every example cost time is 1.5430, generate speed: 12.9615 tokens/s, avg speed: 10.2597 tokens/s, remaining time: 0:02:59 +pred is: + ['He was compelled to break with standard practice and ordain two of his lay preachers as pres'] + label is: + ['result of the American Revolution'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:33:05,507 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:05,507 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:05,507 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:05,508 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:05,508 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:06,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,639 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,669 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,700 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:06,731 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:07,009 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5011563301086426 s; generated tokens: 19 tokens; generate speed: 12.656909622880464 tokens/s +2024-07-30 14:33:07,014 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:07,014 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1937/2067], cost time 1.5123s, every example cost time is 1.5123, generate speed: 12.5633 tokens/s, avg speed: 10.2610 tokens/s, remaining time: 0:02:57 +pred is: + ['1968'] + label is: + ['1968'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:07,096 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:07,097 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:07,097 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:07,097 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:07,097 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:08,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,073 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,104 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,168 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.07076096534729 s; generated tokens: 5 tokens; generate speed: 4.669576275016995 tokens/s +2024-07-30 14:33:08,173 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:08,173 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1938/2067], cost time 1.0818s, every example cost time is 1.0818, generate speed: 4.6217 tokens/s, avg speed: 10.2587 tokens/s, remaining time: 0:02:56 +pred is: + ['Prevenient grace'] + label is: + ['Prevenient grace'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:08,256 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:08,256 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:08,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:08,257 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:08,257 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:09,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,326 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,329 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0720970630645752 s; generated tokens: 5 tokens; generate speed: 4.663756829729173 tokens/s +2024-07-30 14:33:09,334 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:09,334 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1939/2067], cost time 1.0833s, every example cost time is 1.0833, generate speed: 4.6156 tokens/s, avg speed: 10.2564 tokens/s, remaining time: 0:02:55 +pred is: + ['Justifying Grace'] + label is: + ['Justifying Grace or Accepting Grace'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:33:09,417 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:09,417 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:09,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:09,418 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:09,418 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:10,362 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,426 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,487 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:10,956 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5377156734466553 s; generated tokens: 20 tokens; generate speed: 13.006305616415906 tokens/s +2024-07-30 14:33:10,961 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:10,961 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1940/2067], cost time 1.5494s, every example cost time is 1.5494, generate speed: 12.9085 tokens/s, avg speed: 10.2579 tokens/s, remaining time: 0:02:53 +pred is: + ['Sanctifying Grace is that grace of God which sustains the believers in the journey toward Christian'] + label is: + ['grace of God which sustains the believers in the journey toward Christian Perfection'] +The F1/Em of this example is: {'F1': 82.14285714285714, 'Em': 0.0} +F1 score: 62.35176229141441, Em score: 47.628865979381445, current_count: 1940 +2024-07-30 14:33:11,624 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:11,625 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 350, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:11,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:11,625 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:11,625 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:12,572 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,605 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,698 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,729 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,760 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,763 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1374332904815674 s; generated tokens: 7 tokens; generate speed: 6.154207071815469 tokens/s +2024-07-30 14:33:12,768 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:12,768 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1941/2067], cost time 1.1490s, every example cost time is 1.1490, generate speed: 6.0925 tokens/s, avg speed: 10.2561 tokens/s, remaining time: 0:02:52 +pred is: + ['Wesleyan theology'] + label is: + ['Wesleyan theology'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:12,850 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:12,850 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:12,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:12,851 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:12,851 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:13,795 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,828 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,952 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:13,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:14,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:14,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:14,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:14,144 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.292480230331421 s; generated tokens: 12 tokens; generate speed: 9.284474700957654 tokens/s +2024-07-30 14:33:14,149 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:14,149 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1942/2067], cost time 1.3037s, every example cost time is 1.3037, generate speed: 9.2047 tokens/s, avg speed: 10.2556 tokens/s, remaining time: 0:02:51 +pred is: + ['2008'] + label is: + ['2008'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:14,231 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:14,231 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:14,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:14,232 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:14,232 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:15,176 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,458 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,800 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5674481391906738 s; generated tokens: 20 tokens; generate speed: 12.75959280562014 tokens/s +2024-07-30 14:33:15,805 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:15,805 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1943/2067], cost time 1.5789s, every example cost time is 1.5789, generate speed: 12.6668 tokens/s, avg speed: 10.2571 tokens/s, remaining time: 0:02:49 +pred is: + ['The General Board of Church and Society, and the United Methodist Women'] + label is: + ['The General Board of Church and Society, and the United Methodist Women'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:15,889 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:15,889 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:15,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:15,890 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:15,890 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:16,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:16,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:16,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:16,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:16,962 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:16,993 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,087 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,118 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,429 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.538895606994629 s; generated tokens: 20 tokens; generate speed: 12.996333155475572 tokens/s +2024-07-30 14:33:17,434 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:17,434 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1944/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9004 tokens/s, avg speed: 10.2586 tokens/s, remaining time: 0:02:48 +pred is: + ['TUMAS'] + label is: + ['Taskforce of United Methodists on Abortion and Sexuality ('] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:33:17,517 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:17,517 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 236, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:17,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:17,518 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:17,518 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:18,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,528 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,559 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,591 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,622 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,653 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:18,746 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:19,077 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5585367679595947 s; generated tokens: 20 tokens; generate speed: 12.832549357294663 tokens/s +2024-07-30 14:33:19,082 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:19,082 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1945/2067], cost time 1.5698s, every example cost time is 1.5698, generate speed: 12.7407 tokens/s, avg speed: 10.2601 tokens/s, remaining time: 0:02:47 +pred is: + ['temperance'] + label is: + ['temperance movement'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:33:19,164 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:19,164 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:19,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:19,165 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:19,165 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:20,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,174 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,236 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,424 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2583796977996826 s; generated tokens: 11 tokens; generate speed: 8.741399769269842 tokens/s +2024-07-30 14:33:20,429 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:20,429 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1946/2067], cost time 1.2695s, every example cost time is 1.2695, generate speed: 8.6648 tokens/s, avg speed: 10.2593 tokens/s, remaining time: 0:02:45 +pred is: + ['capital punishment'] + label is: + ['capital punishment'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:20,511 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:20,511 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 249, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:20,512 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:20,512 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:20,512 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:21,456 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,491 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,646 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:21,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:22,046 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5338644981384277 s; generated tokens: 20 tokens; generate speed: 13.038961410393792 tokens/s +2024-07-30 14:33:22,051 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:22,051 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1947/2067], cost time 1.5450s, every example cost time is 1.5450, generate speed: 12.9447 tokens/s, avg speed: 10.2609 tokens/s, remaining time: 0:02:44 +pred is: + ['1'] + label is: + ['same-sex unions'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:33:22,132 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:22,133 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 208, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:22,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:22,133 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:22,133 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:23,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,109 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,295 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,325 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,685 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.551208734512329 s; generated tokens: 20 tokens; generate speed: 12.893171341178416 tokens/s +2024-07-30 14:33:23,690 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:23,690 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1948/2067], cost time 1.5624s, every example cost time is 1.5624, generate speed: 12.8005 tokens/s, avg speed: 10.2623 tokens/s, remaining time: 0:02:42 +pred is: + ['Connectional Table'] + label is: + ['Connectional Table'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:23,773 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:23,773 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 265, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:23,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:23,774 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:23,774 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:24,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,752 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,783 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,845 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,938 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,969 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:24,999 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:25,277 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5025691986083984 s; generated tokens: 19 tokens; generate speed: 12.645008308167647 tokens/s +2024-07-30 14:33:25,282 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:25,282 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1949/2067], cost time 1.5138s, every example cost time is 1.5138, generate speed: 12.5512 tokens/s, avg speed: 10.2636 tokens/s, remaining time: 0:02:41 +pred is: + ['1987'] + label is: + ['1987'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:25,363 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:25,364 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 173, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:25,364 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:25,364 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:25,364 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:26,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,403 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,433 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,520 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,551 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,582 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:26,921 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.556682825088501 s; generated tokens: 20 tokens; generate speed: 12.84783237642707 tokens/s +2024-07-30 14:33:26,926 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:26,926 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1950/2067], cost time 1.5678s, every example cost time is 1.5678, generate speed: 12.7564 tokens/s, avg speed: 10.2651 tokens/s, remaining time: 0:02:40 +pred is: + ['Conscription'] + label is: + ['conscription'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.41662504889434, Em score: 47.743589743589745, current_count: 1950 +2024-07-30 14:33:27,598 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:27,598 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:27,599 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:27,599 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:27,599 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:28,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,607 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:28,916 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3171210289001465 s; generated tokens: 13 tokens; generate speed: 9.870011726147572 tokens/s +2024-07-30 14:33:28,921 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:28,921 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1951/2067], cost time 1.3288s, every example cost time is 1.3288, generate speed: 9.7834 tokens/s, avg speed: 10.2649 tokens/s, remaining time: 0:02:38 +pred is: + ["Christ's message and teachings"] + label is: + ["Christ's message and teachings"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:29,004 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:29,004 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 155, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:29,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:29,005 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:29,005 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:29,948 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:29,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,170 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,201 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,232 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,545 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5390396118164062 s; generated tokens: 20 tokens; generate speed: 12.995117114884124 tokens/s +2024-07-30 14:33:30,549 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:30,550 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1952/2067], cost time 1.5503s, every example cost time is 1.5503, generate speed: 12.9006 tokens/s, avg speed: 10.2664 tokens/s, remaining time: 0:02:37 +pred is: + ['The Sexual Ethics Task Force of The United Methodist Church'] + label is: + ['The Sexual Ethics Task Force of The United Methodist Church'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:30,633 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:30,633 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:30,634 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:30,634 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:30,634 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:31,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,673 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,873 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:31,937 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.303037166595459 s; generated tokens: 12 tokens; generate speed: 9.209253816875602 tokens/s +2024-07-30 14:33:31,942 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:31,942 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1953/2067], cost time 1.3142s, every example cost time is 1.3142, generate speed: 9.1308 tokens/s, avg speed: 10.2658 tokens/s, remaining time: 0:02:36 +pred is: + ['IVF'] + label is: + ['IVF'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:32,025 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:32,025 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:32,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:32,026 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:32,026 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:32,968 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,063 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,119 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,151 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,213 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,308 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2818851470947266 s; generated tokens: 11 tokens; generate speed: 8.581111985680213 tokens/s +2024-07-30 14:33:33,313 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:33,313 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1954/2067], cost time 1.2931s, every example cost time is 1.2931, generate speed: 8.5069 tokens/s, avg speed: 10.2650 tokens/s, remaining time: 0:02:34 +pred is: + ['Sunday Service of the Methodists in North America'] + label is: + ['Sunday Service of the Methodists in North America'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:33,396 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:33,396 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 244, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:33,396 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:33,396 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:33,397 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:34,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:34,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:34,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:34,408 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0114240646362305 s; generated tokens: 3 tokens; generate speed: 2.9661149115321694 tokens/s +2024-07-30 14:33:34,413 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:34,413 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1955/2067], cost time 1.0226s, every example cost time is 1.0226, generate speed: 2.9337 tokens/s, avg speed: 10.2622 tokens/s, remaining time: 0:02:33 +pred is: + ['Africa'] + label is: + ['Africa'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:34,495 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:34,495 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:34,495 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:34,496 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:34,496 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:35,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,656 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,687 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:35,718 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:36,026 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.53033447265625 s; generated tokens: 20 tokens; generate speed: 13.069038407849082 tokens/s +2024-07-30 14:33:36,031 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:36,031 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1956/2067], cost time 1.5416s, every example cost time is 1.5416, generate speed: 12.9732 tokens/s, avg speed: 10.2637 tokens/s, remaining time: 0:02:31 +pred is: + ['Methodist institutions may be named after a biblical figure (e.g., "St. James U'] + label is: + ['Methodist institutions'] +The F1/Em of this example is: {'F1': 17.142857142857142, 'Em': 0.0} +2024-07-30 14:33:36,114 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:36,114 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:36,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:36,115 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:36,115 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:37,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,374 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.258829116821289 s; generated tokens: 11 tokens; generate speed: 8.73827897131619 tokens/s +2024-07-30 14:33:37,379 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:37,379 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1957/2067], cost time 1.2700s, every example cost time is 1.2700, generate speed: 8.6615 tokens/s, avg speed: 10.2630 tokens/s, remaining time: 0:02:30 +pred is: + ['United Methodist Church'] + label is: + ['United Methodist Church'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:37,462 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:37,462 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 165, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:37,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:37,462 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:37,463 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:38,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,469 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,626 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.162851333618164 s; generated tokens: 8 tokens; generate speed: 6.879641247955858 tokens/s +2024-07-30 14:33:38,630 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:38,631 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1958/2067], cost time 1.1740s, every example cost time is 1.1740, generate speed: 6.8145 tokens/s, avg speed: 10.2615 tokens/s, remaining time: 0:02:29 +pred is: + ['5'] + label is: + ['five'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:33:38,741 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:38,742 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:38,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:38,742 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:38,743 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:39,686 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,723 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,754 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:39,944 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2008726596832275 s; generated tokens: 9 tokens; generate speed: 7.494549840425268 tokens/s +2024-07-30 14:33:39,948 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:39,949 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1959/2067], cost time 1.2125s, every example cost time is 1.2125, generate speed: 7.4229 tokens/s, avg speed: 10.2602 tokens/s, remaining time: 0:02:27 +pred is: + ['Mission Council'] + label is: + ['Mission Council'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:40,031 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:40,031 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 221, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:40,032 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:40,032 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:40,032 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:40,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,071 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,261 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.228832721710205 s; generated tokens: 10 tokens; generate speed: 8.137804131780188 tokens/s +2024-07-30 14:33:41,266 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:41,266 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1960/2067], cost time 1.2400s, every example cost time is 1.2400, generate speed: 8.0645 tokens/s, avg speed: 10.2592 tokens/s, remaining time: 0:02:26 +pred is: + ['9'] + label is: + ['nine'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.46406209310552, Em score: 47.857142857142854, current_count: 1960 +2024-07-30 14:33:41,933 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:41,933 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 197, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:41,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:41,934 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:41,934 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:42,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:42,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:42,963 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:42,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:43,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:43,027 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0928599834442139 s; generated tokens: 5 tokens; generate speed: 4.575151506821761 tokens/s +2024-07-30 14:33:43,032 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:43,032 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1961/2067], cost time 1.1042s, every example cost time is 1.1042, generate speed: 4.5281 tokens/s, avg speed: 10.2568 tokens/s, remaining time: 0:02:25 +pred is: + ['The Annual Conference'] + label is: + ['The Annual Conference'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:43,115 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:43,115 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:43,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:43,116 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:43,116 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:44,059 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,155 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,219 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1031229496002197 s; generated tokens: 6 tokens; generate speed: 5.4391035941863475 tokens/s +2024-07-30 14:33:44,224 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:44,224 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1962/2067], cost time 1.1143s, every example cost time is 1.1143, generate speed: 5.3845 tokens/s, avg speed: 10.2548 tokens/s, remaining time: 0:02:23 +pred is: + ['The Book of Discipline'] + label is: + ['The Book of Discipline'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:44,307 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:44,307 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 158, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:44,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:44,308 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:44,308 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:45,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,407 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,472 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1643092632293701 s; generated tokens: 8 tokens; generate speed: 6.871026670191485 tokens/s +2024-07-30 14:33:45,477 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:45,477 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1963/2067], cost time 1.1755s, every example cost time is 1.1755, generate speed: 6.8058 tokens/s, avg speed: 10.2533 tokens/s, remaining time: 0:02:22 +pred is: + ['100'] + label is: + ['one hundred'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:33:45,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:45,560 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 245, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:45,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:45,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:45,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:46,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,787 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,821 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2595126628875732 s; generated tokens: 11 tokens; generate speed: 8.733536648040738 tokens/s +2024-07-30 14:33:46,826 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:46,826 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1964/2067], cost time 1.2711s, every example cost time is 1.2711, generate speed: 8.6540 tokens/s, avg speed: 10.2525 tokens/s, remaining time: 0:02:20 +pred is: + ['John Wesley'] + label is: + ['John Wesley'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:46,909 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:46,909 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 214, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:46,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:46,910 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:46,910 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:47,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:47,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:47,918 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:47,949 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:47,980 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:48,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:48,014 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1037273406982422 s; generated tokens: 6 tokens; generate speed: 5.436125190306755 tokens/s +2024-07-30 14:33:48,019 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:48,019 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1965/2067], cost time 1.1152s, every example cost time is 1.1152, generate speed: 5.3800 tokens/s, avg speed: 10.2505 tokens/s, remaining time: 0:02:19 +pred is: + ['The Annual Conference Cabinet'] + label is: + ['Annual Conference Cabinet'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:33:48,101 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:48,101 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:48,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:48,102 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:48,102 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:49,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,079 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,205 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,270 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,302 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,338 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2355568408966064 s; generated tokens: 10 tokens; generate speed: 8.09351676021906 tokens/s +2024-07-30 14:33:49,343 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:49,343 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1966/2067], cost time 1.2469s, every example cost time is 1.2469, generate speed: 8.0201 tokens/s, avg speed: 10.2495 tokens/s, remaining time: 0:02:18 +pred is: + ['Elders'] + label is: + ['Elders'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:49,427 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:49,428 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 202, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:49,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:49,428 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:49,428 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:50,372 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,405 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,501 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0728161334991455 s; generated tokens: 5 tokens; generate speed: 4.660630879675322 tokens/s +2024-07-30 14:33:50,506 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:50,506 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1967/2067], cost time 1.0846s, every example cost time is 1.0846, generate speed: 4.6102 tokens/s, avg speed: 10.2472 tokens/s, remaining time: 0:02:16 +pred is: + ['2-3'] + label is: + ['2–3 years'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:33:50,588 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:50,589 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 174, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:50,589 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:50,589 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:50,589 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:51,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,721 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,782 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:51,813 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:52,120 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5307888984680176 s; generated tokens: 20 tokens; generate speed: 13.065158768799273 tokens/s +2024-07-30 14:33:52,125 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:52,126 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1968/2067], cost time 1.5421s, every example cost time is 1.5421, generate speed: 12.9696 tokens/s, avg speed: 10.2488 tokens/s, remaining time: 0:02:15 +pred is: + ['1996'] + label is: + ['1996'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:52,239 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:52,240 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 423, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:52,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:52,240 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:52,240 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:53,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,252 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,314 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,345 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,376 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,781 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5399963855743408 s; generated tokens: 20 tokens; generate speed: 12.987043467989057 tokens/s +2024-07-30 14:33:53,785 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:53,786 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1969/2067], cost time 1.5518s, every example cost time is 1.5518, generate speed: 12.8884 tokens/s, avg speed: 10.2503 tokens/s, remaining time: 0:02:14 +pred is: + ['Licensed Local Pastor'] + label is: + ['Licensed Local Pastor'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:53,869 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:53,869 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:53,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:53,870 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:53,870 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:54,814 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:54,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:54,878 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:54,908 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:54,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:54,970 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:55,001 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:55,033 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:55,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:55,095 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:55,405 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534315824508667 s; generated tokens: 20 tokens; generate speed: 13.035125937259096 tokens/s +2024-07-30 14:33:55,410 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:55,410 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1970/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9402 tokens/s, avg speed: 10.2518 tokens/s, remaining time: 0:02:12 +pred is: + ['Baptized Members'] + label is: + ['Baptized Members'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.54461676945185, Em score: 47.96954314720812, current_count: 1970 +2024-07-30 14:33:56,084 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:56,084 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:56,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:56,085 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:56,085 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:57,028 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,246 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,277 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,308 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,464 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3789172172546387 s; generated tokens: 15 tokens; generate speed: 10.87810044889012 tokens/s +2024-07-30 14:33:57,469 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:57,469 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1971/2067], cost time 1.3906s, every example cost time is 1.3906, generate speed: 10.7865 tokens/s, avg speed: 10.2521 tokens/s, remaining time: 0:02:11 +pred is: + ['Baptism'] + label is: + ['Baptism'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:57,551 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:57,552 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 258, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:57,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:57,552 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:57,552 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:58,496 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:58,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:58,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:58,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:58,595 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0424208641052246 s; generated tokens: 4 tokens; generate speed: 3.8372217381061837 tokens/s +2024-07-30 14:33:58,600 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:33:58,600 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1972/2067], cost time 1.0536s, every example cost time is 1.0536, generate speed: 3.7967 tokens/s, avg speed: 10.2496 tokens/s, remaining time: 0:02:09 +pred is: + ['lay servants'] + label is: + ['lay servants'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:33:58,683 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:33:58,683 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:33:58,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:58,684 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:33:58,684 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:33:59,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,851 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,882 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:33:59,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:00,224 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5400152206420898 s; generated tokens: 20 tokens; generate speed: 12.986884630699464 tokens/s +2024-07-30 14:34:00,229 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:00,229 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1973/2067], cost time 1.5512s, every example cost time is 1.5512, generate speed: 12.8931 tokens/s, avg speed: 10.2511 tokens/s, remaining time: 0:02:08 +pred is: + ['The United Methodist Church'] + label is: + ['United Methodist Church'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:34:00,312 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:00,312 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:00,312 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:00,313 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:00,313 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:01,256 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,289 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,351 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,382 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,413 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,443 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,474 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,536 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,844 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.530548095703125 s; generated tokens: 20 tokens; generate speed: 13.067214324168045 tokens/s +2024-07-30 14:34:01,848 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:01,849 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1974/2067], cost time 1.5418s, every example cost time is 1.5418, generate speed: 12.9718 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:02:07 +pred is: + ['2000'] + label is: + ['2000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:01,931 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:01,931 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 189, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:01,932 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:01,932 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:01,932 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:02,876 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:02,909 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:02,940 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:02,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,195 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2625741958618164 s; generated tokens: 11 tokens; generate speed: 8.712359270491463 tokens/s +2024-07-30 14:34:03,200 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:03,200 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1975/2067], cost time 1.2737s, every example cost time is 1.2737, generate speed: 8.6364 tokens/s, avg speed: 10.2519 tokens/s, remaining time: 0:02:05 +pred is: + ['11 million'] + label is: + ['11 million'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:03,282 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:03,283 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 260, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:03,283 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:03,283 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:03,284 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:04,228 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,324 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,355 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,386 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,418 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,727 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4437932968139648 s; generated tokens: 17 tokens; generate speed: 11.774538666659621 tokens/s +2024-07-30 14:34:04,732 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:04,733 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1976/2067], cost time 1.4550s, every example cost time is 1.4550, generate speed: 11.6835 tokens/s, avg speed: 10.2527 tokens/s, remaining time: 0:02:04 +pred is: + ['11.4 million'] + label is: + ['11.4 million'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:04,815 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:04,815 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:04,816 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:04,816 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:04,816 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:05,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,854 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,885 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:05,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:06,020 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:06,051 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:06,268 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4511487483978271 s; generated tokens: 17 tokens; generate speed: 11.714856949550642 tokens/s +2024-07-30 14:34:06,272 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:06,273 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1977/2067], cost time 1.4623s, every example cost time is 1.4623, generate speed: 11.6252 tokens/s, avg speed: 10.2534 tokens/s, remaining time: 0:02:03 +pred is: + ['1'] + label is: + ['Wesleyan Holiness Consortium'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:34:06,355 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:06,356 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:06,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:06,356 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:06,356 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:07,300 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:07,333 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:07,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:07,395 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:07,398 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0417022705078125 s; generated tokens: 4 tokens; generate speed: 3.8398687544859307 tokens/s +2024-07-30 14:34:07,403 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:07,403 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1978/2067], cost time 1.0530s, every example cost time is 1.0530, generate speed: 3.7987 tokens/s, avg speed: 10.2509 tokens/s, remaining time: 0:02:01 +pred is: + ['1754'] + label is: + ['1754–1763'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:34:07,485 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:07,486 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 162, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:07,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:07,486 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:07,486 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:08,429 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,462 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,555 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,648 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:08,709 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:09,021 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5344324111938477 s; generated tokens: 20 tokens; generate speed: 13.03413552405298 tokens/s +2024-07-30 14:34:09,026 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:09,026 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1979/2067], cost time 1.5456s, every example cost time is 1.5456, generate speed: 12.9404 tokens/s, avg speed: 10.2524 tokens/s, remaining time: 0:02:00 +pred is: + ['Along the frontiers between New France and the British colonies'] + label is: + ['primarily along the frontiers between New France and the British colonies'] +The F1/Em of this example is: {'F1': 95.0, 'Em': 0.0} +2024-07-30 14:34:09,110 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:09,110 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 281, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:09,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:09,111 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:09,111 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:10,056 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,121 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,182 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,244 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,275 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,337 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:10,370 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2591629028320312 s; generated tokens: 11 tokens; generate speed: 8.735962578995522 tokens/s +2024-07-30 14:34:10,375 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:10,376 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1980/2067], cost time 1.2704s, every example cost time is 1.2704, generate speed: 8.6586 tokens/s, avg speed: 10.2517 tokens/s, remaining time: 0:01:59 +pred is: + ['1755'] + label is: + ['1755'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.64708503492599, Em score: 48.03030303030303, current_count: 1980 +2024-07-30 14:34:11,060 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:11,060 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:11,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:11,061 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:11,061 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:12,005 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,070 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,131 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,162 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,192 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,285 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,594 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.532743215560913 s; generated tokens: 20 tokens; generate speed: 13.048500099007729 tokens/s +2024-07-30 14:34:12,599 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:12,599 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1981/2067], cost time 1.5445s, every example cost time is 1.5445, generate speed: 12.9493 tokens/s, avg speed: 10.2532 tokens/s, remaining time: 0:01:57 +pred is: + ['William Pitt'] + label is: + ['William Pitt'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:12,682 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:12,682 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:12,683 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:12,683 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:12,683 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:13,625 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:13,658 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:13,690 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:13,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:13,724 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0406434535980225 s; generated tokens: 4 tokens; generate speed: 3.8437756814497885 tokens/s +2024-07-30 14:34:13,729 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:13,729 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1982/2067], cost time 1.0518s, every example cost time is 1.0518, generate speed: 3.8031 tokens/s, avg speed: 10.2507 tokens/s, remaining time: 0:01:56 +pred is: + ['French Louisiana'] + label is: + ['territory east of the Mississippi to Great Britain'] +The F1/Em of this example is: {'F1': 11.11111111111111, 'Em': 0.0} +2024-07-30 14:34:13,819 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:13,819 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 212, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:13,820 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:13,820 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:13,820 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:14,764 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,796 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,827 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,956 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:14,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:15,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:15,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:15,357 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5367815494537354 s; generated tokens: 20 tokens; generate speed: 13.014211425891471 tokens/s +2024-07-30 14:34:15,362 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:15,362 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1983/2067], cost time 1.5483s, every example cost time is 1.5483, generate speed: 12.9173 tokens/s, avg speed: 10.2522 tokens/s, remaining time: 0:01:54 +pred is: + ['1744'] + label is: + ['1740s'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:34:15,445 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:15,446 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 166, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:15,446 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:15,446 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:15,447 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:16,389 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,576 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,579 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1322503089904785 s; generated tokens: 7 tokens; generate speed: 6.182378529215191 tokens/s +2024-07-30 14:34:16,584 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:16,584 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1984/2067], cost time 1.1441s, every example cost time is 1.1441, generate speed: 6.1185 tokens/s, avg speed: 10.2505 tokens/s, remaining time: 0:01:53 +pred is: + ['1754-1760'] + label is: + ['declaration of war in 1756 to the signing of the peace treaty in 1763'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:34:16,675 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:16,675 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:16,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:16,676 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:16,676 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:17,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,652 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,684 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,745 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,748 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0716981887817383 s; generated tokens: 5 tokens; generate speed: 4.66549262874447 tokens/s +2024-07-30 14:34:17,753 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:17,753 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1985/2067], cost time 1.0832s, every example cost time is 1.0832, generate speed: 4.6161 tokens/s, avg speed: 10.2482 tokens/s, remaining time: 0:01:52 +pred is: + ['75,000'] + label is: + ['about 75,000'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:34:17,835 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:17,835 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:17,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:17,835 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:17,836 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:18,779 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,812 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,843 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,907 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.07163405418396 s; generated tokens: 5 tokens; generate speed: 4.665771846721927 tokens/s +2024-07-30 14:34:18,912 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:18,912 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1986/2067], cost time 1.0827s, every example cost time is 1.0827, generate speed: 4.6180 tokens/s, avg speed: 10.2460 tokens/s, remaining time: 0:01:50 +pred is: + ['20:1'] + label is: + ['20 to 1'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:34:18,995 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:18,995 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 193, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:18,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:18,996 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:18,996 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:19,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:19,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,065 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,538 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5418782234191895 s; generated tokens: 20 tokens; generate speed: 12.971192988022773 tokens/s +2024-07-30 14:34:20,543 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:20,543 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1987/2067], cost time 1.5531s, every example cost time is 1.5531, generate speed: 12.8776 tokens/s, avg speed: 10.2475 tokens/s, remaining time: 0:01:49 +pred is: + ['Native tribes'] + label is: + ['native tribes'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:20,626 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:20,627 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 301, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:20,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:20,627 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:20,628 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:21,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,761 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,792 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,823 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,853 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:21,978 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3506641387939453 s; generated tokens: 14 tokens; generate speed: 10.365271126914708 tokens/s +2024-07-30 14:34:21,983 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:21,983 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1988/2067], cost time 1.3618s, every example cost time is 1.3618, generate speed: 10.2802 tokens/s, avg speed: 10.2475 tokens/s, remaining time: 0:01:48 +pred is: + ['Catawba'] + label is: + ['Catawba, Muskogee-speaking Creek and Choctaw'] +The F1/Em of this example is: {'F1': 18.181818181818183, 'Em': 0.0} +2024-07-30 14:34:22,066 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:22,066 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 147, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:22,066 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:22,066 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:22,067 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:23,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,042 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,107 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,140 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0735993385314941 s; generated tokens: 5 tokens; generate speed: 4.657230887305846 tokens/s +2024-07-30 14:34:23,145 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:23,145 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1989/2067], cost time 1.0848s, every example cost time is 1.0848, generate speed: 4.6092 tokens/s, avg speed: 10.2453 tokens/s, remaining time: 0:01:46 +pred is: + ['3,000'] + label is: + ['no French regular army troops were stationed in North America'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:34:23,228 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:23,228 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 213, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:23,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:23,229 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:23,229 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:24,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,268 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,360 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:24,517 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.287280797958374 s; generated tokens: 12 tokens; generate speed: 9.321975453243757 tokens/s +2024-07-30 14:34:24,521 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:24,522 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1990/2067], cost time 1.2985s, every example cost time is 1.2985, generate speed: 9.2417 tokens/s, avg speed: 10.2448 tokens/s, remaining time: 0:01:45 +pred is: + ['3,000 miles (4,800 km)'] + label is: + ['about 3,000 miles (4,800 km) between June and November 1749.'] +The F1/Em of this example is: {'F1': 66.66666666666666, 'Em': 0.0} +F1 score: 62.51868741965481, Em score: 47.88944723618091, current_count: 1990 +2024-07-30 14:34:25,209 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:25,209 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:25,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:25,210 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:25,210 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:26,153 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,186 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,309 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,340 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,371 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,402 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,747 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536879062652588 s; generated tokens: 20 tokens; generate speed: 13.013385689229738 tokens/s +2024-07-30 14:34:26,752 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:26,752 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1991/2067], cost time 1.5485s, every example cost time is 1.5485, generate speed: 12.9161 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:01:43 +pred is: + ['They ignored it'] + label is: + ['informed Céloron that they owned the Ohio Country and that they would trade with the British regardless of the French'] +The F1/Em of this example is: {'F1': 8.695652173913045, 'Em': 0.0} +2024-07-30 14:34:26,836 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:26,837 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 207, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:26,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:26,837 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:26,838 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:27,781 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,879 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,910 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,941 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:27,972 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:28,003 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:28,034 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:28,064 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:28,372 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.534740686416626 s; generated tokens: 20 tokens; generate speed: 13.031517426371748 tokens/s +2024-07-30 14:34:28,377 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:28,378 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1992/2067], cost time 1.5460s, every example cost time is 1.5460, generate speed: 12.9366 tokens/s, avg speed: 10.2478 tokens/s, remaining time: 0:01:42 +pred is: + ['Badly'] + label is: + ['very badly disposed towards the French, and are entirely devoted to the English'] +The F1/Em of this example is: {'F1': 7.4074074074074066, 'Em': 0.0} +2024-07-30 14:34:28,461 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:28,461 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:28,461 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:28,462 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:28,462 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:29,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,564 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,626 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,657 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,721 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2594664096832275 s; generated tokens: 11 tokens; generate speed: 8.733857382323238 tokens/s +2024-07-30 14:34:29,726 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:29,727 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1993/2067], cost time 1.2706s, every example cost time is 1.2706, generate speed: 8.6571 tokens/s, avg speed: 10.2471 tokens/s, remaining time: 0:01:41 +pred is: + ['1749'] + label is: + ['1749'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:29,809 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:29,809 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 183, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:29,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:29,810 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:29,810 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:30,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,817 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:30,914 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1039738655090332 s; generated tokens: 6 tokens; generate speed: 5.434911266883523 tokens/s +2024-07-30 14:34:30,919 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:30,919 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1994/2067], cost time 1.1152s, every example cost time is 1.1152, generate speed: 5.3804 tokens/s, avg speed: 10.2451 tokens/s, remaining time: 0:01:39 +pred is: + ["King George's War"] + label is: + ["King George's War"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:31,001 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:31,002 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 261, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:31,002 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:31,002 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:31,002 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:31,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:31,981 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,013 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,044 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,106 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,137 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,201 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1981220245361328 s; generated tokens: 9 tokens; generate speed: 7.511755744148395 tokens/s +2024-07-30 14:34:32,205 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:32,206 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1995/2067], cost time 1.2093s, every example cost time is 1.2093, generate speed: 7.4421 tokens/s, avg speed: 10.2439 tokens/s, remaining time: 0:01:38 +pred is: + ['Marquis de la Jonquière'] + label is: + ['Marquis de la Jonquière'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:32,288 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:32,288 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 312, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:32,288 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:32,289 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:32,289 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:33,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,267 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,299 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,329 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,391 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,422 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,515 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,610 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3212480545043945 s; generated tokens: 13 tokens; generate speed: 9.839181942921652 tokens/s +2024-07-30 14:34:33,615 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:33,615 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1996/2067], cost time 1.3325s, every example cost time is 1.3325, generate speed: 9.7561 tokens/s, avg speed: 10.2436 tokens/s, remaining time: 0:01:37 +pred is: + ['Paul Marin de la Malgue'] + label is: + ['Paul Marin de la Malgue'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:33,698 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:33,699 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 250, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:33,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:33,699 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:33,699 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:34,643 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,676 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,707 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,769 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,800 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,831 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,861 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,892 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:34,923 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:35,231 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5318043231964111 s; generated tokens: 20 tokens; generate speed: 13.056497946334336 tokens/s +2024-07-30 14:34:35,236 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:35,237 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1997/2067], cost time 1.5430s, every example cost time is 1.5430, generate speed: 12.9617 tokens/s, avg speed: 10.2452 tokens/s, remaining time: 0:01:35 +pred is: + ['Colonel of the Iroquois'] + label is: + ['British Superintendent for Indian Affairs in the New York region and beyond'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:34:35,320 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:35,320 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:35,320 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:35,321 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:35,321 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:36,264 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,451 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,543 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,851 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5297887325286865 s; generated tokens: 20 tokens; generate speed: 13.073700684761032 tokens/s +2024-07-30 14:34:36,855 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:36,856 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1998/2067], cost time 1.5410s, every example cost time is 1.5410, generate speed: 12.9788 tokens/s, avg speed: 10.2467 tokens/s, remaining time: 0:01:34 +pred is: + ['The Ohio Company'] + label is: + ['Ohio Company'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:34:36,939 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:36,939 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 178, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:36,939 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:36,939 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:36,940 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:37,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:37,916 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:37,947 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:37,977 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,008 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,039 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,100 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,161 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,480 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5404365062713623 s; generated tokens: 20 tokens; generate speed: 12.983332918024738 tokens/s +2024-07-30 14:34:38,485 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:38,485 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[1999/2067], cost time 1.5517s, every example cost time is 1.5517, generate speed: 12.8892 tokens/s, avg speed: 10.2482 tokens/s, remaining time: 0:01:33 +pred is: + ['Jacques Legardeur de Saint-Pierre'] + label is: + ['Jacques Legardeur de Saint-Pierre'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:38,569 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:38,569 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 187, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:38,569 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:38,570 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:38,570 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:39,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:39,547 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:39,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:39,581 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0107965469360352 s; generated tokens: 3 tokens; generate speed: 2.9679563202839523 tokens/s +2024-07-30 14:34:39,585 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:39,586 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2000/2067], cost time 1.0220s, every example cost time is 1.0220, generate speed: 2.9353 tokens/s, avg speed: 10.2455 tokens/s, remaining time: 0:01:31 +pred is: + ['500'] + label is: + ['Contrecœur led 500 men south from Fort Venango on April 5, 1754'] +The F1/Em of this example is: {'F1': 7.4074074074074066, 'Em': 0.0} +F1 score: 62.515349216050915, Em score: 47.9, current_count: 2000 +2024-07-30 14:34:40,271 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:40,271 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:40,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:40,272 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:40,272 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:41,217 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,250 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,281 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,313 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,499 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,807 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5348608493804932 s; generated tokens: 20 tokens; generate speed: 13.030497199842241 tokens/s +2024-07-30 14:34:41,812 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:41,813 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2001/2067], cost time 1.5468s, every example cost time is 1.5468, generate speed: 12.9303 tokens/s, avg speed: 10.2470 tokens/s, remaining time: 0:01:30 +pred is: + ['He continued toward Fort Duquesne'] + label is: + ['with Tanaghrisson and his party, surprised the Canadians on May 28 in what became known as the Battle of Jumonville Glen'] +The F1/Em of this example is: {'F1': 3.9215686274509802, 'Em': 0.0} +2024-07-30 14:34:41,897 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:41,897 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:41,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:41,898 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:41,898 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:42,841 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:42,874 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:42,905 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:42,936 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:42,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,434 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.535658359527588 s; generated tokens: 20 tokens; generate speed: 13.023730099807205 tokens/s +2024-07-30 14:34:43,442 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:43,442 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2002/2067], cost time 1.5500s, every example cost time is 1.5500, generate speed: 12.9030 tokens/s, avg speed: 10.2485 tokens/s, remaining time: 0:01:28 +pred is: + ['To dislodge the French'] + label is: + ['dislodge the French'] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:34:43,526 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:43,527 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:43,527 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:43,528 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:43,528 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:44,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,818 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2898881435394287 s; generated tokens: 12 tokens; generate speed: 9.303132260036305 tokens/s +2024-07-30 14:34:44,823 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:44,823 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2003/2067], cost time 1.3015s, every example cost time is 1.3015, generate speed: 9.2200 tokens/s, avg speed: 10.2480 tokens/s, remaining time: 0:01:27 +pred is: + ['Albany Congress'] + label is: + ['Albany Congress'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:44,905 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:44,905 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 177, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:44,906 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:44,906 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:44,906 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:45,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:45,887 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:45,919 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:45,922 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0156662464141846 s; generated tokens: 3 tokens; generate speed: 2.9537261975491624 tokens/s +2024-07-30 14:34:45,927 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:45,927 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2004/2067], cost time 1.0270s, every example cost time is 1.0270, generate speed: 2.9211 tokens/s, avg speed: 10.2453 tokens/s, remaining time: 0:01:26 +pred is: + ['Braddock'] + label is: + ['Braddock (with George Washington as one of his aides) led about 1,500 army troops'] +The F1/Em of this example is: {'F1': 6.25, 'Em': 0.0} +2024-07-30 14:34:46,010 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:46,010 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 188, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:46,011 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:46,011 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:46,011 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:46,954 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:46,987 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,019 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,050 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,081 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,112 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,144 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,175 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,206 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,237 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,549 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5375251770019531 s; generated tokens: 20 tokens; generate speed: 13.00791707294078 tokens/s +2024-07-30 14:34:47,554 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:47,554 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2005/2067], cost time 1.5487s, every example cost time is 1.5487, generate speed: 12.9140 tokens/s, avg speed: 10.2468 tokens/s, remaining time: 0:01:24 +pred is: + ["Shirley's"] + label is: + ['Shirley and Johnson.'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 14:34:47,637 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:47,637 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 264, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:47,638 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:47,638 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:47,638 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:48,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,617 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,649 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,680 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,711 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,742 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:48,932 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2939021587371826 s; generated tokens: 12 tokens; generate speed: 9.274271566029158 tokens/s +2024-07-30 14:34:48,937 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:48,937 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2006/2067], cost time 1.3055s, every example cost time is 1.3055, generate speed: 9.1917 tokens/s, avg speed: 10.2463 tokens/s, remaining time: 0:01:23 +pred is: + ['Vaudreuil'] + label is: + ['Marquis de Vaudreuil.'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:34:49,021 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:49,021 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 267, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:49,022 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:49,022 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:49,022 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:49,967 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,000 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,031 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,062 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,125 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,563 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.540539264678955 s; generated tokens: 20 tokens; generate speed: 12.982466892311216 tokens/s +2024-07-30 14:34:50,568 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:50,568 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2007/2067], cost time 1.5519s, every example cost time is 1.5519, generate speed: 12.8877 tokens/s, avg speed: 10.2478 tokens/s, remaining time: 0:01:22 +pred is: + ['Colonel Monckton'] + label is: + ['Colonel Monckton'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:50,650 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:50,651 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:50,651 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:50,651 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:50,651 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:51,595 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,659 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:51,877 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:52,188 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.536745548248291 s; generated tokens: 20 tokens; generate speed: 13.01451630870032 tokens/s +2024-07-30 14:34:52,193 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:52,194 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2008/2067], cost time 1.5481s, every example cost time is 1.5481, generate speed: 12.9190 tokens/s, avg speed: 10.2493 tokens/s, remaining time: 0:01:20 +pred is: + ['William Shirley'] + label is: + ['William Shirley'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:52,276 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:52,276 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 204, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:52,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:52,277 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:52,277 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:53,220 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,253 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,284 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,315 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,347 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,410 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,441 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,472 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,814 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5371346473693848 s; generated tokens: 20 tokens; generate speed: 13.011221908391382 tokens/s +2024-07-30 14:34:53,819 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:53,819 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2009/2067], cost time 1.5484s, every example cost time is 1.5484, generate speed: 12.9169 tokens/s, avg speed: 10.2508 tokens/s, remaining time: 0:01:19 +pred is: + ['Major General James Abercrombie'] + label is: + ['Major General James Abercrombie'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:53,902 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:53,902 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:53,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:53,903 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:53,903 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:54,847 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:54,880 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:54,911 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:54,942 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:54,973 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,004 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,036 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,067 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,098 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,129 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:55,440 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5366380214691162 s; generated tokens: 20 tokens; generate speed: 13.015427003998525 tokens/s +2024-07-30 14:34:55,445 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:55,445 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2010/2067], cost time 1.5477s, every example cost time is 1.5477, generate speed: 12.9220 tokens/s, avg speed: 10.2523 tokens/s, remaining time: 0:01:17 +pred is: + ['1'] + label is: + ['Oneida Carry'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.47512287803793, Em score: 47.86069651741293, current_count: 2010 +2024-07-30 14:34:56,133 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:56,133 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 209, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:56,134 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:56,134 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:56,134 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:57,078 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,111 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,142 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,173 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,269 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.135159969329834 s; generated tokens: 7 tokens; generate speed: 6.166531756870003 tokens/s +2024-07-30 14:34:57,274 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:57,275 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2011/2067], cost time 1.1466s, every example cost time is 1.1466, generate speed: 6.1050 tokens/s, avg speed: 10.2505 tokens/s, remaining time: 0:01:16 +pred is: + ['Abercrombie'] + label is: + ['Abercrombie'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:34:57,357 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:57,357 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 205, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:57,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:57,358 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:57,358 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:58,301 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,366 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,397 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,428 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,896 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5372159481048584 s; generated tokens: 20 tokens; generate speed: 13.010533767007038 tokens/s +2024-07-30 14:34:58,901 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:34:58,901 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2012/2067], cost time 1.5495s, every example cost time is 1.5495, generate speed: 12.9077 tokens/s, avg speed: 10.2520 tokens/s, remaining time: 0:01:15 +pred is: + ["An attack on New France's capital, Quebec"] + label is: + ["attack on New France's capital, Quebec"] +The F1/Em of this example is: {'F1': 93.33333333333333, 'Em': 0.0} +2024-07-30 14:34:58,985 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:34:58,985 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:34:58,986 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:58,986 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:34:58,986 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:34:59,931 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:59,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:34:59,995 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,027 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,058 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,120 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,152 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,183 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,214 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,310 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3240900039672852 s; generated tokens: 13 tokens; generate speed: 9.818063697368714 tokens/s +2024-07-30 14:35:00,315 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:00,315 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2013/2067], cost time 1.3353s, every example cost time is 1.3353, generate speed: 9.7356 tokens/s, avg speed: 10.2518 tokens/s, remaining time: 0:01:13 +pred is: + ['A'] + label is: + ['French irregular forces (Canadian scouts and Indians)'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:00,398 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:00,398 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 271, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:00,399 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:00,399 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:00,399 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:01,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,377 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,439 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,502 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,565 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,596 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,627 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:01,959 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5596885681152344 s; generated tokens: 20 tokens; generate speed: 12.823072765204971 tokens/s +2024-07-30 14:35:01,964 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:01,964 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2014/2067], cost time 1.5710s, every example cost time is 1.5710, generate speed: 12.7309 tokens/s, avg speed: 10.2532 tokens/s, remaining time: 0:01:12 +pred is: + ['The British blockade of the French coastline limited French shipping.'] + label is: + ['British blockade of the French coastline limited French shipping.'] +The F1/Em of this example is: {'F1': 94.73684210526316, 'Em': 0.0} +2024-07-30 14:35:02,048 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:02,048 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:02,048 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:02,049 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:02,049 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:02,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,025 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,057 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,089 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,211 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,242 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,306 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,620 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5712127685546875 s; generated tokens: 20 tokens; generate speed: 12.729020792261899 tokens/s +2024-07-30 14:35:03,625 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:03,625 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2015/2067], cost time 1.5824s, every example cost time is 1.5824, generate speed: 12.6386 tokens/s, avg speed: 10.2546 tokens/s, remaining time: 0:01:11 +pred is: + ['The British failures in North America, combined with other failures in the European theater'] + label is: + ['British failures in North America, combined with other failures in the European theater'] +The F1/Em of this example is: {'F1': 96.2962962962963, 'Em': 0.0} +2024-07-30 14:35:03,709 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:03,710 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 179, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:03,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:03,710 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:03,711 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:04,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:04,688 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:04,719 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:04,751 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:04,754 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0428485870361328 s; generated tokens: 4 tokens; generate speed: 3.835647906824471 tokens/s +2024-07-30 14:35:04,758 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:04,759 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2016/2067], cost time 1.0541s, every example cost time is 1.0541, generate speed: 3.7946 tokens/s, avg speed: 10.2521 tokens/s, remaining time: 0:01:09 +pred is: + ['3600'] + label is: + ['3,600'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:04,841 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:04,841 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 194, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:04,842 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:04,842 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:04,842 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:05,785 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,818 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,849 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:05,975 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:06,006 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:06,037 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:06,068 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:06,381 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5392959117889404 s; generated tokens: 20 tokens; generate speed: 12.992953367073119 tokens/s +2024-07-30 14:35:06,386 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:06,387 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2017/2067], cost time 1.5508s, every example cost time is 1.5508, generate speed: 12.8964 tokens/s, avg speed: 10.2536 tokens/s, remaining time: 0:01:08 +pred is: + ['Invasion of Britain'] + label is: + ['invasion of Britain, to draw British resources away from North America and the European mainland'] +The F1/Em of this example is: {'F1': 28.57142857142857, 'Em': 0.0} +2024-07-30 14:35:06,470 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:06,470 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 168, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:06,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:06,471 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:06,471 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:07,415 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:07,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:07,480 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:07,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:07,514 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0427768230438232 s; generated tokens: 4 tokens; generate speed: 3.835911876449423 tokens/s +2024-07-30 14:35:07,519 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:07,519 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2018/2067], cost time 1.0539s, every example cost time is 1.0539, generate speed: 3.7954 tokens/s, avg speed: 10.2511 tokens/s, remaining time: 0:01:07 +pred is: + ['James Wolfe'] + label is: + ['James Wolfe'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:07,629 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:07,629 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 172, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:07,630 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:07,630 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:07,630 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:08,573 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,762 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,824 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:08,855 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:09,166 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5355644226074219 s; generated tokens: 20 tokens; generate speed: 13.024526816035216 tokens/s +2024-07-30 14:35:09,171 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:09,171 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2019/2067], cost time 1.5472s, every example cost time is 1.5472, generate speed: 12.9268 tokens/s, avg speed: 10.2526 tokens/s, remaining time: 0:01:05 +pred is: + ['Governor Vaudreuil'] + label is: + ['Governor Vaudreuil'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:09,254 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:09,254 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 324, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:09,254 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:09,255 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:09,255 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:10,200 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,233 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,453 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,484 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:10,518 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2629241943359375 s; generated tokens: 11 tokens; generate speed: 8.70994478475721 tokens/s +2024-07-30 14:35:10,523 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:10,523 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2020/2067], cost time 1.2741s, every example cost time is 1.2741, generate speed: 8.6336 tokens/s, avg speed: 10.2519 tokens/s, remaining time: 0:01:04 +pred is: + ['1763'] + label is: + ['signing of the Treaty of Paris on 10 February 1763'] +The F1/Em of this example is: {'F1': 10.0, 'Em': 0.0} +F1 score: 62.47422519067454, Em score: 47.772277227722775, current_count: 2020 +2024-07-30 14:35:11,220 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:11,221 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 215, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:11,221 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:11,222 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:11,222 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:12,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,295 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0731866359710693 s; generated tokens: 5 tokens; generate speed: 4.659021862936046 tokens/s +2024-07-30 14:35:12,300 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:12,300 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2021/2067], cost time 1.0846s, every example cost time is 1.0846, generate speed: 4.6098 tokens/s, avg speed: 10.2497 tokens/s, remaining time: 0:01:02 +pred is: + ['80,000'] + label is: + ['80,000'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:12,383 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:12,383 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 232, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:12,383 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:12,384 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:12,384 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:13,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,424 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,455 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,486 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,517 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,549 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,580 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,611 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,675 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2914862632751465 s; generated tokens: 12 tokens; generate speed: 9.291620314697411 tokens/s +2024-07-30 14:35:13,680 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:13,680 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2022/2067], cost time 1.3027s, every example cost time is 1.3027, generate speed: 9.2119 tokens/s, avg speed: 10.2492 tokens/s, remaining time: 0:01:01 +pred is: + ['King George III'] + label is: + ['King George III'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:13,793 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:13,793 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 230, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:13,794 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:13,794 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:13,794 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:14,738 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,803 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,834 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,865 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,896 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,927 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,958 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:14,989 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:15,021 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:15,209 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4147837162017822 s; generated tokens: 16 tokens; generate speed: 11.309149106518282 tokens/s +2024-07-30 14:35:15,214 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:15,214 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2023/2067], cost time 1.4263s, every example cost time is 1.4263, generate speed: 11.2180 tokens/s, avg speed: 10.2497 tokens/s, remaining time: 0:01:00 +pred is: + ['Cuba'] + label is: + ['Most went to Cuba,'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 14:35:15,297 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:15,297 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 237, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:15,298 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:15,298 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:15,298 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:16,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:16,276 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:16,307 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:16,310 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0115387439727783 s; generated tokens: 3 tokens; generate speed: 2.965778639597747 tokens/s +2024-07-30 14:35:16,315 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:16,315 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2024/2067], cost time 1.0226s, every example cost time is 1.0226, generate speed: 2.9338 tokens/s, avg speed: 10.2470 tokens/s, remaining time: 0:00:58 +pred is: + ['1'] + label is: + ['force'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:16,397 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:16,397 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:16,398 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:16,398 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:16,398 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:17,341 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:17,373 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:17,404 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:17,436 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:17,439 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0404791831970215 s; generated tokens: 4 tokens; generate speed: 3.8443825350829477 tokens/s +2024-07-30 14:35:17,443 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:17,444 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2025/2067], cost time 1.0515s, every example cost time is 1.0515, generate speed: 3.8042 tokens/s, avg speed: 10.2445 tokens/s, remaining time: 0:00:57 +pred is: + ['Standard Model'] + label is: + ['Standard Model'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:17,526 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:17,526 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 296, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:17,526 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:17,527 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:17,527 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:18,471 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,602 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,633 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,727 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:18,758 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:19,072 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.544523000717163 s; generated tokens: 20 tokens; generate speed: 12.94898165369727 tokens/s +2024-07-30 14:35:19,076 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:19,077 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2026/2067], cost time 1.5556s, every example cost time is 1.5556, generate speed: 12.8569 tokens/s, avg speed: 10.2460 tokens/s, remaining time: 0:00:56 +pred is: + ['Aristotle'] + label is: + ['Aristotle'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:19,159 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:19,159 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:19,159 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:19,160 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:19,160 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:20,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,135 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,167 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,198 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,229 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,260 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,291 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,322 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,353 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,408 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,473 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3127684593200684 s; generated tokens: 12 tokens; generate speed: 9.14098744131562 tokens/s +2024-07-30 14:35:20,478 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:20,478 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2027/2067], cost time 1.3239s, every example cost time is 1.3239, generate speed: 9.0639 tokens/s, avg speed: 10.2454 tokens/s, remaining time: 0:00:54 +pred is: + ['17th century'] + label is: + ['17th century'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:20,560 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:20,560 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 287, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:20,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:20,561 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:20,561 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:21,506 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,539 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,570 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,601 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,632 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,695 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,726 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,757 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,760 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1989326477050781 s; generated tokens: 9 tokens; generate speed: 7.50667689067208 tokens/s +2024-07-30 14:35:21,765 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:21,765 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2028/2067], cost time 1.2099s, every example cost time is 1.2099, generate speed: 7.4386 tokens/s, avg speed: 10.2442 tokens/s, remaining time: 0:00:53 +pred is: + ['1'] + label is: + ['Newton'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:21,847 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:21,847 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 279, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:21,848 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:21,848 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:21,848 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:22,793 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,826 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,858 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,889 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,920 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,951 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:22,982 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:23,014 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:23,045 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:23,076 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:23,388 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5394845008850098 s; generated tokens: 20 tokens; generate speed: 12.991361711340723 tokens/s +2024-07-30 14:35:23,393 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:23,393 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2029/2067], cost time 1.5506s, every example cost time is 1.5506, generate speed: 12.8979 tokens/s, avg speed: 10.2457 tokens/s, remaining time: 0:00:51 +pred is: + ['1'] + label is: + ['laws of physics'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:23,475 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:23,475 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 269, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:23,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:23,476 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:23,476 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:24,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,454 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,485 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,518 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,550 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,581 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,612 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,644 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,675 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:24,706 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:25,018 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541656494140625 s; generated tokens: 20 tokens; generate speed: 12.97305857434131 tokens/s +2024-07-30 14:35:25,023 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:25,023 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2030/2067], cost time 1.5528s, every example cost time is 1.5528, generate speed: 12.8797 tokens/s, avg speed: 10.2472 tokens/s, remaining time: 0:00:50 +pred is: + ['1'] + label is: + ['inertia'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.42372271299743, Em score: 47.783251231527096, current_count: 2030 +2024-07-30 14:35:25,719 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:25,720 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 190, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:25,720 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:25,720 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:25,720 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:26,664 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,696 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,728 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,759 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,790 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,822 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,825 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.1042816638946533 s; generated tokens: 6 tokens; generate speed: 5.433396384432215 tokens/s +2024-07-30 14:35:26,830 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:26,830 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2031/2067], cost time 1.1158s, every example cost time is 1.1158, generate speed: 5.3773 tokens/s, avg speed: 10.2452 tokens/s, remaining time: 0:00:49 +pred is: + ["Newton's Second Law"] + label is: + ["Newton's Second Law"] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:26,912 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:26,912 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:26,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:26,913 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:26,913 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:27,857 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:27,890 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:27,921 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:27,953 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:27,984 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,015 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,046 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,077 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,478 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5650441646575928 s; generated tokens: 20 tokens; generate speed: 12.779192083934378 tokens/s +2024-07-30 14:35:28,483 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:28,484 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2032/2067], cost time 1.5763s, every example cost time is 1.5763, generate speed: 12.6877 tokens/s, avg speed: 10.2466 tokens/s, remaining time: 0:00:47 +pred is: + ["Newton's Third Law"] + label is: + ["Newton's Third"] +The F1/Em of this example is: {'F1': 83.33333333333333, 'Em': 0.0} +2024-07-30 14:35:28,566 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:28,567 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:28,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:28,567 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:28,568 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:29,510 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,546 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,578 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,609 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,705 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,737 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,768 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,771 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2027614116668701 s; generated tokens: 9 tokens; generate speed: 7.4827808014951 tokens/s +2024-07-30 14:35:29,775 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:29,776 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2033/2067], cost time 1.2142s, every example cost time is 1.2142, generate speed: 7.4123 tokens/s, avg speed: 10.2453 tokens/s, remaining time: 0:00:46 +pred is: + ['The center of mass of the system'] + label is: + ['center of mass'] +The F1/Em of this example is: {'F1': 55.55555555555556, 'Em': 0.0} +2024-07-30 14:35:29,858 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:29,859 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 131, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:29,859 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:29,859 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:29,860 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:30,802 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,835 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,866 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,898 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,929 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:30,992 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:31,024 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:31,055 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:31,086 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:31,401 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5407588481903076 s; generated tokens: 20 tokens; generate speed: 12.980616676964681 tokens/s +2024-07-30 14:35:31,405 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:31,406 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2034/2067], cost time 1.5520s, every example cost time is 1.5520, generate speed: 12.8862 tokens/s, avg speed: 10.2468 tokens/s, remaining time: 0:00:45 +pred is: + ['1'] + label is: + ['intuitive understanding'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:31,487 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:31,488 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 287, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:31,488 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:31,488 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:31,489 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:32,434 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,467 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,498 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,530 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,561 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,592 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,623 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,654 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,685 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,716 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,900 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4115359783172607 s; generated tokens: 15 tokens; generate speed: 10.626721692125766 tokens/s +2024-07-30 14:35:32,905 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:32,905 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2035/2067], cost time 1.4227s, every example cost time is 1.4227, generate speed: 10.5431 tokens/s, avg speed: 10.2470 tokens/s, remaining time: 0:00:43 +pred is: + ['1'] + label is: + ['vector quantities'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:32,988 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:32,988 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:32,988 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:32,989 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:32,989 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:33,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:33,966 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:33,997 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,091 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,436 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4473824501037598 s; generated tokens: 17 tokens; generate speed: 11.745340700228406 tokens/s +2024-07-30 14:35:34,441 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:34,441 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2036/2067], cost time 1.4587s, every example cost time is 1.4587, generate speed: 11.6545 tokens/s, avg speed: 10.2477 tokens/s, remaining time: 0:00:42 +pred is: + ['In conditions of static equilibrium'] + label is: + ['static equilibrium'] +The F1/Em of this example is: {'F1': 50.0, 'Em': 0.0} +2024-07-30 14:35:34,524 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:34,525 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 278, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:34,525 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:34,525 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:34,525 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:35,470 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,503 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,535 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,598 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,629 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,661 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,692 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,724 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,755 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,758 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2322907447814941 s; generated tokens: 10 tokens; generate speed: 8.114968031974604 tokens/s +2024-07-30 14:35:35,763 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:35,763 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2037/2067], cost time 1.2434s, every example cost time is 1.2434, generate speed: 8.0422 tokens/s, avg speed: 10.2467 tokens/s, remaining time: 0:00:41 +pred is: + ['2'] + label is: + ['independent components'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:35,845 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:35,845 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 146, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:35,846 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:35,846 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:35,846 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:36,788 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:36,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:36,884 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:36,915 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:36,946 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:36,978 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,009 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,040 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,072 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,103 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,416 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5701031684875488 s; generated tokens: 20 tokens; generate speed: 12.738016457393451 tokens/s +2024-07-30 14:35:37,421 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:37,421 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2038/2067], cost time 1.5814s, every example cost time is 1.5814, generate speed: 12.6474 tokens/s, avg speed: 10.2481 tokens/s, remaining time: 0:00:39 +pred is: + ['1'] + label is: + ['static friction'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:37,504 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:37,504 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 206, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:37,504 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:37,505 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:37,505 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:38,448 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,481 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,513 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,575 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,606 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,637 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,668 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,699 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:38,730 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:39,041 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5360829830169678 s; generated tokens: 20 tokens; generate speed: 13.020129915584826 tokens/s +2024-07-30 14:35:39,046 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:39,046 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2039/2067], cost time 1.5472s, every example cost time is 1.5472, generate speed: 12.9262 tokens/s, avg speed: 10.2496 tokens/s, remaining time: 0:00:38 +pred is: + ['The force of gravity acting on the object balanced by a force applied by the "spring reaction force'] + label is: + ['forces'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:39,129 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:39,129 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 314, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:39,130 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:39,130 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:39,130 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:40,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,108 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,171 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,202 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,234 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,265 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,296 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,327 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,358 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:40,392 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.262129306793213 s; generated tokens: 11 tokens; generate speed: 8.71543029766778 tokens/s +2024-07-30 14:35:40,397 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:40,397 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2040/2067], cost time 1.2732s, every example cost time is 1.2732, generate speed: 8.6397 tokens/s, avg speed: 10.2488 tokens/s, remaining time: 0:00:36 +pred is: + ['Galileo'] + label is: + ['Galileo'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 62.308355880526314, Em score: 47.64705882352941, current_count: 2040 +2024-07-30 14:35:41,109 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:41,109 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 161, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:41,110 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:41,110 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:41,110 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:42,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,085 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,148 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,179 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,210 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,241 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,646 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5361332893371582 s; generated tokens: 20 tokens; generate speed: 13.01970352366363 tokens/s +2024-07-30 14:35:42,651 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:42,651 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2041/2067], cost time 1.5595s, every example cost time is 1.5595, generate speed: 12.8246 tokens/s, avg speed: 10.2503 tokens/s, remaining time: 0:00:35 +pred is: + ['1'] + label is: + ['dynamic equilibrium'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:42,734 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:42,734 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 167, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:42,735 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:42,735 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:42,735 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:43,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:43,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:44,290 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5547759532928467 s; generated tokens: 20 tokens; generate speed: 12.863589739500519 tokens/s +2024-07-30 14:35:44,295 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:44,295 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2042/2067], cost time 1.5659s, every example cost time is 1.5659, generate speed: 12.7718 tokens/s, avg speed: 10.2517 tokens/s, remaining time: 0:00:34 +pred is: + ['Schrödinger equation'] + label is: + ['Schrödinger'] +The F1/Em of this example is: {'F1': 74.99999999999999, 'Em': 0.0} +2024-07-30 14:35:44,378 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:44,378 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 257, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:44,378 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:44,379 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:44,379 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:45,323 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:45,356 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:45,359 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.9800500869750977 s; generated tokens: 2 tokens; generate speed: 2.0407120274566317 tokens/s +2024-07-30 14:35:45,364 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:45,364 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2043/2067], cost time 0.9911s, every example cost time is 0.9911, generate speed: 2.0179 tokens/s, avg speed: 10.2488 tokens/s, remaining time: 0:00:32 +pred is: + ['spin'] + label is: + ['spin'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:45,446 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:45,446 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 401, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:45,447 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:45,447 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:45,447 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:46,394 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,427 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,522 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,553 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,647 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,678 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:46,928 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.4810552597045898 s; generated tokens: 18 tokens; generate speed: 12.153496557306218 tokens/s +2024-07-30 14:35:46,933 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:46,933 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2044/2067], cost time 1.4922s, every example cost time is 1.4922, generate speed: 12.0626 tokens/s, avg speed: 10.2497 tokens/s, remaining time: 0:00:31 +pred is: + ['As a mathematical by-product of exchange of momentum-carrying gauge bosons.'] + label is: + ['mathematical by-product'] +The F1/Em of this example is: {'F1': 26.08695652173913, 'Em': 0.0} +2024-07-30 14:35:47,016 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:47,017 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 224, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:47,017 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:47,017 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:47,017 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:47,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:47,994 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:48,026 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:48,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.011063575744629 s; generated tokens: 3 tokens; generate speed: 2.967172462711415 tokens/s +2024-07-30 14:35:48,033 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:48,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2045/2067], cost time 1.0221s, every example cost time is 1.0221, generate speed: 2.9351 tokens/s, avg speed: 10.2471 tokens/s, remaining time: 0:00:30 +pred is: + ['4'] + label is: + ['four'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:48,122 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:48,122 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 343, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:48,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:48,123 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:48,123 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:49,069 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,102 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,133 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,165 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,227 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,258 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,290 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,321 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,352 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,416 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.293236494064331 s; generated tokens: 12 tokens; generate speed: 9.279045290693034 tokens/s +2024-07-30 14:35:49,421 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:49,421 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2046/2067], cost time 1.3108s, every example cost time is 1.3108, generate speed: 9.1546 tokens/s, avg speed: 10.2466 tokens/s, remaining time: 0:00:28 +pred is: + ['1'] + label is: + ['Isaac Newton'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:49,504 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:49,504 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 218, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:49,505 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:49,505 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:49,505 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:50,449 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,482 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,545 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,577 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,608 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,640 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,671 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,703 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:50,734 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:51,052 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5467047691345215 s; generated tokens: 20 tokens; generate speed: 12.930715931774916 tokens/s +2024-07-30 14:35:51,057 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:51,057 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2047/2067], cost time 1.5580s, every example cost time is 1.5580, generate speed: 12.8373 tokens/s, avg speed: 10.2480 tokens/s, remaining time: 0:00:27 +pred is: + ['1'] + label is: + ['Isaac Newton'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:51,140 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:51,140 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 149, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:51,140 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:51,141 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:51,141 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:52,083 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,116 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,181 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,212 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,243 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,274 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,305 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,336 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,367 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,678 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5367999076843262 s; generated tokens: 20 tokens; generate speed: 13.014055961349131 tokens/s +2024-07-30 14:35:52,683 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:52,683 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2048/2067], cost time 1.5480s, every example cost time is 1.5480, generate speed: 12.9195 tokens/s, avg speed: 10.2495 tokens/s, remaining time: 0:00:25 +pred is: + ['1'] + label is: + ['at larger distances.'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:35:52,765 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:52,766 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 211, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:52,766 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:52,766 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:52,766 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:53,710 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,806 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,837 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,868 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,899 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,930 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,961 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:53,964 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.197618007659912 s; generated tokens: 9 tokens; generate speed: 7.514917062399192 tokens/s +2024-07-30 14:35:53,969 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:53,969 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2049/2067], cost time 1.2087s, every example cost time is 1.2087, generate speed: 7.4458 tokens/s, avg speed: 10.2483 tokens/s, remaining time: 0:00:24 +pred is: + ["Newton's Universal Gravitation Constant"] + label is: + ["Newton's Universal Gravitation Constant,"] +The F1/Em of this example is: {'F1': 94.73684210526316, 'Em': 0.0} +2024-07-30 14:35:54,052 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:54,052 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 170, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:54,053 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:54,053 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:54,053 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:54,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,029 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,061 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,092 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,126 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0724358558654785 s; generated tokens: 5 tokens; generate speed: 4.6622835040934865 tokens/s +2024-07-30 14:35:55,130 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:55,131 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2050/2067], cost time 1.0835s, every example cost time is 1.0835, generate speed: 4.6146 tokens/s, avg speed: 10.2461 tokens/s, remaining time: 0:00:23 +pred is: + ['Vulcan'] + label is: + ['Mercury'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.1487169731223, Em score: 47.46341463414634, current_count: 2050 +2024-07-30 14:35:55,839 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:55,839 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 272, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:55,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:55,840 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:55,840 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:56,786 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,819 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,850 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,881 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,913 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,944 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:56,979 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:57,012 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:57,043 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:57,075 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:57,108 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2679340839385986 s; generated tokens: 11 tokens; generate speed: 8.67552985548789 tokens/s +2024-07-30 14:35:57,113 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:57,113 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2051/2067], cost time 1.2795s, every example cost time is 1.2795, generate speed: 8.5970 tokens/s, avg speed: 10.2453 tokens/s, remaining time: 0:00:21 +pred is: + ['general relativity'] + label is: + ['general relativity'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:35:57,195 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:57,195 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 151, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:57,196 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:57,196 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:57,196 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:58,139 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,172 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,204 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,235 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,266 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,297 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,359 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,390 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,421 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,424 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2272169589996338 s; generated tokens: 10 tokens; generate speed: 8.148518423467275 tokens/s +2024-07-30 14:35:58,429 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:35:58,429 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2052/2067], cost time 1.2384s, every example cost time is 1.2384, generate speed: 8.0747 tokens/s, avg speed: 10.2444 tokens/s, remaining time: 0:00:20 +pred is: + ['The time rate of change of electric charge'] + label is: + ['electric current'] +The F1/Em of this example is: {'F1': 22.22222222222222, 'Em': 0.0} +2024-07-30 14:35:58,515 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:35:58,515 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 195, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:35:58,516 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:58,516 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:35:58,516 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:35:59,459 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,493 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,524 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,556 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,587 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:35:59,744 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:00,058 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.541367769241333 s; generated tokens: 20 tokens; generate speed: 12.97548865307082 tokens/s +2024-07-30 14:36:00,062 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:00,063 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2053/2067], cost time 1.5530s, every example cost time is 1.5530, generate speed: 12.8784 tokens/s, avg speed: 10.2458 tokens/s, remaining time: 0:00:19 +pred is: + ['1'] + label is: + ['James Clerk Maxwell'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:00,146 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:00,146 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 169, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:00,146 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:00,147 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:00,147 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:01,090 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,123 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,154 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,185 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,216 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,248 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,279 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,344 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,375 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,500 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3534460067749023 s; generated tokens: 14 tokens; generate speed: 10.343966386483567 tokens/s +2024-07-30 14:36:01,505 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:01,505 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2054/2067], cost time 1.3647s, every example cost time is 1.3647, generate speed: 10.2589 tokens/s, avg speed: 10.2458 tokens/s, remaining time: 0:00:17 +pred is: + ['The nonexistence of the ultraviolet catastrophe'] + label is: + ['electromagnetic theory'] +The F1/Em of this example is: {'F1': 14.285714285714288, 'Em': 0.0} +2024-07-30 14:36:01,589 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:01,589 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 192, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:01,590 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:01,590 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:01,590 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:02,533 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,566 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,597 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,628 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,660 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,691 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,722 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,784 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:02,815 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:03,126 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5353271961212158 s; generated tokens: 20 tokens; generate speed: 13.02653926181151 tokens/s +2024-07-30 14:36:03,131 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:03,131 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2055/2067], cost time 1.5468s, every example cost time is 1.5468, generate speed: 12.9300 tokens/s, avg speed: 10.2473 tokens/s, remaining time: 0:00:16 +pred is: + ['The electromagnetic force'] + label is: + ['repulsion of like charges'] +The F1/Em of this example is: {'F1': 16.666666666666664, 'Em': 0.0} +2024-07-30 14:36:03,222 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:03,222 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 156, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:03,223 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:03,223 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:03,223 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:04,166 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,199 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,230 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,261 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,292 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,295 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0717990398406982 s; generated tokens: 5 tokens; generate speed: 4.665053628657058 tokens/s +2024-07-30 14:36:04,300 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:04,300 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2056/2067], cost time 1.0833s, every example cost time is 1.0833, generate speed: 4.6155 tokens/s, avg speed: 10.2451 tokens/s, remaining time: 0:00:15 +pred is: + ['Elementary particles'] + label is: + ['elementary particles'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:36:04,383 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:04,384 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 191, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:04,384 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:04,384 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:04,385 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:05,328 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:05,361 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:05,392 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:05,423 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:05,426 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0413830280303955 s; generated tokens: 4 tokens; generate speed: 3.841045890257441 tokens/s +2024-07-30 14:36:05,431 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:05,431 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2057/2067], cost time 1.0527s, every example cost time is 1.0527, generate speed: 3.7999 tokens/s, avg speed: 10.2427 tokens/s, remaining time: 0:00:13 +pred is: + ['Weak force'] + label is: + ['weak force'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +2024-07-30 14:36:05,513 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:05,514 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 163, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:05,514 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:05,514 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:05,515 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:06,457 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,490 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,521 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,552 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,584 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,615 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,645 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,677 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,708 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:06,739 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:07,049 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5342645645141602 s; generated tokens: 20 tokens; generate speed: 13.035561442646754 tokens/s +2024-07-30 14:36:07,054 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:07,054 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2058/2067], cost time 1.5454s, every example cost time is 1.5454, generate speed: 12.9413 tokens/s, avg speed: 10.2442 tokens/s, remaining time: 0:00:12 +pred is: + ['1'] + label is: + ['normal force'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:07,137 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:07,137 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 262, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:07,138 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:07,138 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:07,138 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:08,082 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,115 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,147 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,178 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,209 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,240 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,272 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,303 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,334 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,683 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5445897579193115 s; generated tokens: 20 tokens; generate speed: 12.948421998435126 tokens/s +2024-07-30 14:36:08,688 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:08,688 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2059/2067], cost time 1.5558s, every example cost time is 1.5558, generate speed: 12.8554 tokens/s, avg speed: 10.2457 tokens/s, remaining time: 0:00:10 +pred is: + ['A'] + label is: + ['ideal strings'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:08,771 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:08,771 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 160, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:08,771 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:08,772 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:08,772 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:09,714 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,778 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,809 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,840 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,871 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,903 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,934 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,965 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:09,996 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:10,092 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3200159072875977 s; generated tokens: 13 tokens; generate speed: 9.848366166065931 tokens/s +2024-07-30 14:36:10,097 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:10,097 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2060/2067], cost time 1.3312s, every example cost time is 1.3312, generate speed: 9.7659 tokens/s, avg speed: 10.2454 tokens/s, remaining time: 0:00:09 +pred is: + ['1'] + label is: + ['idealized point particles'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +F1 score: 62.01846815440549, Em score: 47.37864077669903, current_count: 2060 +2024-07-30 14:36:10,810 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:10,810 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 150, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:10,810 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:10,811 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:10,811 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:11,753 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,789 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,821 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,852 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,883 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,914 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,945 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:11,976 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:12,007 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:12,038 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:12,349 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5384571552276611 s; generated tokens: 20 tokens; generate speed: 13.00003703843179 tokens/s +2024-07-30 14:36:12,354 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:12,354 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2061/2067], cost time 1.5499s, every example cost time is 1.5499, generate speed: 12.9038 tokens/s, avg speed: 10.2469 tokens/s, remaining time: 0:00:08 +pred is: + ['1'] + label is: + ['stress tensor'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:12,437 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:12,438 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 141, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:12,438 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:12,438 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:12,439 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:13,381 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:13,414 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:13,445 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:13,476 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:13,479 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.0404064655303955 s; generated tokens: 4 tokens; generate speed: 3.8446512324976894 tokens/s +2024-07-30 14:36:13,484 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:13,484 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2062/2067], cost time 1.0515s, every example cost time is 1.0515, generate speed: 3.8040 tokens/s, avg speed: 10.2445 tokens/s, remaining time: 0:00:06 +pred is: + ['Angular velocity'] + label is: + ['rotational equivalent for position'] +The F1/Em of this example is: {'F1': 20.0, 'Em': 0.0} +2024-07-30 14:36:13,567 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:13,567 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 228, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:13,567 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:13,567 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:13,568 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:14,511 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:14,544 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:14,547 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 0.978954553604126 s; generated tokens: 2 tokens; generate speed: 2.0429957577057953 tokens/s +2024-07-30 14:36:14,551 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:14,552 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2063/2067], cost time 0.9900s, every example cost time is 0.9900, generate speed: 2.0201 tokens/s, avg speed: 10.2416 tokens/s, remaining time: 0:00:05 +pred is: + ['A'] + label is: + ['toward the center of the curving path'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:14,641 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:14,642 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 164, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:14,642 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:14,642 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:14,643 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:15,586 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,619 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,650 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,681 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,712 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,743 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,774 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,805 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,836 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:15,867 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:16,029 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.3860623836517334 s; generated tokens: 15 tokens; generate speed: 10.822023724849133 tokens/s +2024-07-30 14:36:16,034 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:16,034 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2064/2067], cost time 1.3975s, every example cost time is 1.3975, generate speed: 10.7332 tokens/s, avg speed: 10.2418 tokens/s, remaining time: 0:00:04 +pred is: + ['A'] + label is: + ['kinetic'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:16,116 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:16,116 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 175, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:16,117 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:16,117 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:16,117 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:17,060 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,093 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,124 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,156 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,187 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,218 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,249 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,280 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,311 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,342 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,652 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5352089405059814 s; generated tokens: 20 tokens; generate speed: 13.02754268315315 tokens/s +2024-07-30 14:36:17,657 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:17,657 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2065/2067], cost time 1.5464s, every example cost time is 1.5464, generate speed: 12.9337 tokens/s, avg speed: 10.2433 tokens/s, remaining time: 0:00:02 +pred is: + ['1'] + label is: + ['forces'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:17,739 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:17,740 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 133, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:17,740 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:17,740 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:17,740 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:18,682 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,715 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,747 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,777 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,808 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,839 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,870 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,901 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,933 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:18,964 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:19,276 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.5355427265167236 s; generated tokens: 20 tokens; generate speed: 13.024710843031158 tokens/s +2024-07-30 14:36:19,281 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:19,281 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2066/2067], cost time 1.5467s, every example cost time is 1.5467, generate speed: 12.9305 tokens/s, avg speed: 10.2448 tokens/s, remaining time: 0:00:01 +pred is: + ['1'] + label is: + ['statistical mechanics'] +The F1/Em of this example is: {'F1': 0.0, 'Em': 0.0} +2024-07-30 14:36:19,364 - mindformers[mindformers/generation/text_generator.py:695] - WARNING - When do_sample is set to False, top_k will be set to 0, making them inactive. +2024-07-30 14:36:19,365 - mindformers[mindformers/generation/text_generator.py:697] - INFO - Generation Config is: {'max_length': 227, 'max_new_tokens': 20, 'min_length': 0, 'min_new_tokens': 1, 'num_beams': 1, 'do_sample': False, 'use_past': True, 'temperature': 1.0, 'top_k': 0, 'top_p': 1, 'repetition_penalty': 1, 'encoder_repetition_penalty': 1.0, 'renormalize_logits': False, 'pad_token_id': 128002, 'bos_token_id': 128000, 'eos_token_id': 128001, '_from_model_config': True} +2024-07-30 14:36:19,365 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:19,365 - mindformers[mindformers/generation/text_generator.py:93] - INFO - Set kbk infer :True +2024-07-30 14:36:19,366 - mindformers[mindformers/modules/block_tables.py:63] - INFO - init cache engine success. +2024-07-30 14:36:20,310 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,343 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,374 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,406 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,437 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,468 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,500 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,531 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,562 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,594 - mindformers[mindformers/generation/text_generator.py:252] - INFO - The generation mode will be **GREEDY_SEARCH**. +2024-07-30 14:36:20,629 - mindformers[mindformers/generation/text_generator.py:890] - INFO - total time: 1.2631099224090576 s; generated tokens: 11 tokens; generate speed: 8.708664071785872 tokens/s +2024-07-30 14:36:20,634 - mindformers[mindformers/modules/block_tables.py:129] - INFO - Clear block table cache engines. +2024-07-30 14:36:20,634 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:283] - INFO - Step[2067/2067], cost time 1.2745s, every example cost time is 1.2745, generate speed: 8.6311 tokens/s, avg speed: 10.2441 tokens/s, remaining time: 0:00:00 +pred is: + ['kilogram-force'] + label is: + ['kilogram-force'] +The F1/Em of this example is: {'F1': 100.0, 'Em': 100.0} +F1 score: 61.86649462896725, Em score: 47.26656990807934, total_count: 2067 +2024-07-30 14:36:21,357 - mindformers[mindformers/trainer/causal_language_modeling/causal_language_modeling.py:299] - INFO - ...........Evaluate Over!............... diff --git a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/format_ms.py b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/format_ms.py new file mode 100644 index 00000000..8f5cd567 --- /dev/null +++ b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/format_ms.py @@ -0,0 +1,30 @@ +import json +import jsonlines + +with jsonlines.open(r"E:\DianWork\DianGPT\昇腾AI\dataset\trainset_v2.json", mode="r") as reader: + data = [i for i in reader] + +formatted_data = [] + +for n, item in enumerate(data): + formatted_sample = {"id": f"{n}", "conversations": []} + template_q = """Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: {query} ### Response:""" + q = template_q.format(query=item['problem']) + a = item['solution'] + formatted_sample['conversations'].append( + { + "from": "human", + "value": q, + } + ) + formatted_sample['conversations'].append( + { + "from": "gpt", + "value": a, + } + ) + formatted_data.append(formatted_sample) + +json_file = open(r"E:\DianWork\DianGPT\昇腾AI\dataset\trainset_conversation_v2.json", "w", encoding="utf-8") + +json.dump(formatted_data, json_file, ensure_ascii=False, indent=4) diff --git a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/sample_script.ipynb b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/sample_script.ipynb new file mode 100644 index 00000000..486ee86f --- /dev/null +++ b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/sample_script.ipynb @@ -0,0 +1,610 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import re\n" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "json_path = r\"E:\\DianWork\\DianGPT\\昇腾AI\\dataset\\train_rate.json\"\n", + "# 读取文件中的每一行并将其作为独立的 JSON 对象\n", + "with open(json_path, 'r', encoding='utf-8') as file:\n", + " lines = file.readlines()\n", + "\n", + "# 将每行的 JSON 对象存储在一个列表中\n", + "json_data = '[' + ','.join([line.strip() for line in lines]) + ']'\n", + "\n", + "# 使用 pandas 读取 JSON 数据\n", + "df = pd.read_json(json_data)\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "df['rate'] = df['rate'].apply(lambda x : int(str(x)[-1]))" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "2 153424\n", + "1 107548\n", + "3 87059\n", + "4 24075\n", + "5 1603\n", + "Name: rate, dtype: int64" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['rate'].value_counts()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "373709" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(df)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "

\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
problemsolutionrate
0解方程 -69x + 58 = 0方程的解为:0.84057971014492753
1解方程 -40x + 28 = 0方程的解为:0.72
2一个长方形的长为 68 厘米,宽为 11 厘米,请计算其面积。面积为 748 平方厘米1
3计算 2213.66 的平方根?√2213.66 = 47.049548350648383243189831803
4计算 -7017.58 + -1621.10 等于多少?-7017.58 + -1621.10 = -8638.681
............
373704解方程 94x + -6 = 0方程的解为:0.063829787234042552
373705将分数 6/8 进行简化。最简化的形式为:3/41
373706计算 8361.03 + -1232.50 等于多少?8361.03 + -1232.50 = 7128.531
373707计算 1138.54 / -3887.08 等于多少?1138.54 / -3887.08 = -0.2929036706216491556644...2
373708计算 5471.42 / -1169.10 等于多少?5471.42 / -1169.10 = -4.6800273714823368403045...2
\n", + "

373709 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " problem \\\n", + "0 解方程 -69x + 58 = 0 \n", + "1 解方程 -40x + 28 = 0 \n", + "2 一个长方形的长为 68 厘米,宽为 11 厘米,请计算其面积。 \n", + "3 计算 2213.66 的平方根? \n", + "4 计算 -7017.58 + -1621.10 等于多少? \n", + "... ... \n", + "373704 解方程 94x + -6 = 0 \n", + "373705 将分数 6/8 进行简化。 \n", + "373706 计算 8361.03 + -1232.50 等于多少? \n", + "373707 计算 1138.54 / -3887.08 等于多少? \n", + "373708 计算 5471.42 / -1169.10 等于多少? \n", + "\n", + " solution rate \n", + "0 方程的解为:0.8405797101449275 3 \n", + "1 方程的解为:0.7 2 \n", + "2 面积为 748 平方厘米 1 \n", + "3 √2213.66 = 47.04954835064838324318983180 3 \n", + "4 -7017.58 + -1621.10 = -8638.68 1 \n", + "... ... ... \n", + "373704 方程的解为:0.06382978723404255 2 \n", + "373705 最简化的形式为:3/4 1 \n", + "373706 8361.03 + -1232.50 = 7128.53 1 \n", + "373707 1138.54 / -3887.08 = -0.2929036706216491556644... 2 \n", + "373708 5471.42 / -1169.10 = -4.6800273714823368403045... 2 \n", + "\n", + "[373709 rows x 3 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "rate_1_samples = df[df['rate'] == 1].sample(n=50, random_state=1)\n", + "rate_2_samples = df[df['rate'] == 2].sample(n=50, random_state=1)\n", + "rate_3_samples = df[df['rate'] == 3].sample(n=50, random_state=1)\n", + "rate_4_samples = df[df['rate'] == 4].sample(n=50, random_state=1)\n", + "\n", + "# 合并所有采样数据\n", + "sampled_df = pd.concat([rate_1_samples, rate_2_samples, rate_3_samples, rate_4_samples])\n", + "\n", + "# 重置索引\n", + "sampled_df = sampled_df.reset_index(drop=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
problemsolutionrate
0计算 1165.68 - 8338.19 等于多少?1165.68 - 8338.19 = -7172.511
1计算 -5937.66 / -6385.23 等于多少?-5937.66 / -6385.23 = 0.9299054223575344975827...1
2计算 -3519.37 + -5293.07 等于多少?-3519.37 + -5293.07 = -8812.441
3计算 5814.36 - -4360.31 等于多少?5814.36 - -4360.31 = 10174.671
4计算 4897.15 + -5674.53 等于多少?4897.15 + -5674.53 = -777.381
............
195当 x = 0.42 时,求函数 y = 68x^54 的值函数的值为:3.075888541204702149694216383E-194
196计算 1937.51 的平方根?√1937.51 = 44.017155746367801859696569984
197计算 -887.47 的 4 次方?-887.47^4 = 620318487026.685400814
198计算 301.95 的 2 次方?301.95^2 = 91173.80254
199当 x = 2.60 时,求函数 y = 99x^56 的值函数的值为:17145204950824123365719408.724
\n", + "

200 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " problem \\\n", + "0 计算 1165.68 - 8338.19 等于多少? \n", + "1 计算 -5937.66 / -6385.23 等于多少? \n", + "2 计算 -3519.37 + -5293.07 等于多少? \n", + "3 计算 5814.36 - -4360.31 等于多少? \n", + "4 计算 4897.15 + -5674.53 等于多少? \n", + ".. ... \n", + "195 当 x = 0.42 时,求函数 y = 68x^54 的值 \n", + "196 计算 1937.51 的平方根? \n", + "197 计算 -887.47 的 4 次方? \n", + "198 计算 301.95 的 2 次方? \n", + "199 当 x = 2.60 时,求函数 y = 99x^56 的值 \n", + "\n", + " solution rate \n", + "0 1165.68 - 8338.19 = -7172.51 1 \n", + "1 -5937.66 / -6385.23 = 0.9299054223575344975827... 1 \n", + "2 -3519.37 + -5293.07 = -8812.44 1 \n", + "3 5814.36 - -4360.31 = 10174.67 1 \n", + "4 4897.15 + -5674.53 = -777.38 1 \n", + ".. ... ... \n", + "195 函数的值为:3.075888541204702149694216383E-19 4 \n", + "196 √1937.51 = 44.01715574636780185969656998 4 \n", + "197 -887.47^4 = 620318487026.68540081 4 \n", + "198 301.95^2 = 91173.8025 4 \n", + "199 函数的值为:17145204950824123365719408.72 4 \n", + "\n", + "[200 rows x 3 columns]" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sampled_df" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "out_df = sampled_df.sample(200)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
problemsolutionrate
123计算 9808.16 * -9250.51 等于多少?9808.16 * -9250.51 = -90730482.16163
101解方程 -96x + -39 = 0方程的解为:-0.406253
175计算 834.71 的 3 次方?834.71^3 = 581576499.8961114
125计算 -5144.60 * 6444.46 等于多少?-5144.60 * 6444.46 = -33154168.91603
172当 x = 1.17 时,求函数 y = 50x^61 的值函数的值为:721618.35419230301376332326854
............
71解方程 18x + 42 = 0方程的解为:-2.33333333333333352
122计算 2166.63 的平方根?√2166.63 = 46.547072947716057218747023333
174计算 5719.89 * 8693.94 等于多少?5719.89 * 8693.94 = 49728380.46664
32某物体的密度为 2 克/立方厘米,体积为 1 立方厘米,请计算该物体的质量。2 克1
159计算 -4183.32 * 1175.95 等于多少?-4183.32 * 1175.95 = -4919375.15404
\n", + "

200 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " problem \\\n", + "123 计算 9808.16 * -9250.51 等于多少? \n", + "101 解方程 -96x + -39 = 0 \n", + "175 计算 834.71 的 3 次方? \n", + "125 计算 -5144.60 * 6444.46 等于多少? \n", + "172 当 x = 1.17 时,求函数 y = 50x^61 的值 \n", + ".. ... \n", + "71 解方程 18x + 42 = 0 \n", + "122 计算 2166.63 的平方根? \n", + "174 计算 5719.89 * 8693.94 等于多少? \n", + "32 某物体的密度为 2 克/立方厘米,体积为 1 立方厘米,请计算该物体的质量。 \n", + "159 计算 -4183.32 * 1175.95 等于多少? \n", + "\n", + " solution rate \n", + "123 9808.16 * -9250.51 = -90730482.1616 3 \n", + "101 方程的解为:-0.40625 3 \n", + "175 834.71^3 = 581576499.896111 4 \n", + "125 -5144.60 * 6444.46 = -33154168.9160 3 \n", + "172 函数的值为:721618.3541923030137633232685 4 \n", + ".. ... ... \n", + "71 方程的解为:-2.3333333333333335 2 \n", + "122 √2166.63 = 46.54707294771605721874702333 3 \n", + "174 5719.89 * 8693.94 = 49728380.4666 4 \n", + "32 2 克 1 \n", + "159 -4183.32 * 1175.95 = -4919375.1540 4 \n", + "\n", + "[200 rows x 3 columns]" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "out_df" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "# 将sampled_df导出为JSON文件,每一行对应一个JSON对象\n", + "out_df.to_json(r'E:\\DianWork\\DianGPT\\昇腾AI\\dataset\\testset.json', orient='records', lines=True,force_ascii=False)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "def extract_number(solution):\n", + " \"\"\"提取数学表达式中的数值\"\"\"\n", + " return int(float(re.findall(r\"[-+]?\\d*\\.\\d+|\\d+\", solution)[-1]))" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "57" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "solution = \"平均值为 57.833333333333336\"\n", + "extract_number(solution)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Datawhale", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.12" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_math.ipynb b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_math.ipynb new file mode 100644 index 00000000..762273fc --- /dev/null +++ b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_math.ipynb @@ -0,0 +1,1952 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "data = np.load(r'E:\\DianWork\\DianGPT\\昇腾AI\\output_data\\result_npy.npy', allow_pickle=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([{'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9808.16 * -9250.51 等于多少? ### Response: 9808.16 * -9250.51 = -90736200.9966', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -96x + -39 = 0 ### Response: -96x + -39 = 0 -96x = 39 x = -0.40625']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 834.71 的 3 次方? ### Response: 834.71^3 = 6,000,000.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5144.60 * 6444.46 等于多少? ### Response: -33190000.9964']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 1.17 时,求函数 y = 50x^61 的值 ### Response: 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 9.42 时,求函数 y = 95x^85 的值 ### Response: 1. 1.2 × 10^87 2. 1.2 × 10^86 3. 1.2 × 10^85 4. 1.2 × 10^84\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 9.42 时,求函数 y = 95x^85 的值 ### Response: 1. 1.2 × 10^87 2. 1.2 × 10^86 3. 1.2 × 10^']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 266.17 + 6631.21 等于多少? ### Response: 6897.38', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3878.55 * 7858.65 等于多少? ### Response: 30,500,000.00']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6815.81 的平方根? ### Response: √6815.81 = 82.2\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6815.81 的平方根? ### Response: √6815.81 = 82.2\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6815.81 的平方根? ### Response: √6815.81 = 82.2\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6815.81 的平方', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -9040.81 + 816.30 等于多少? ### Response: -9024.51']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6448.42 / 4291.54 等于多少? ### Response: 1.5', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 4.25 时,求函数 y = 37x^16 的值 ### Response: 1. 1.2 × 10^7 2. 1.2 × 10^6 3. 1.2 × 10^5 4. 1.2 × 10^4\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 4.25 时,求函数 y = 37x^16 的值 ### Response: 1. 1.2 × 10^7 2. 1.2 × 10^6 3. 1.2 × 10^']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5427.93 的平方根? ### Response: √5427.93 = 73.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5427.93 的平方根? ### Response: √5427.93 = 73.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5427.93 的平方根? ### Response: √5427.93 = 73.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 542', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9388.31 的平方根? ### Response: √9388.31 = 97.1']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -584.32 的 1 次方? ### Response: -584.32^1 = -584.32', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 求以下数据的平均值:[49, 9, 43, 60, 78, 8, 59] ### Response: 43.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[49, 9, 43, 60, 78, 8, 59] ### Response: 43.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[49, 9, 43, 60, 78, 8, 59] ### Response: 43.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[49, 9, 43, 60, 78, 8, 59']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 去年销售额为 34 万元,今年销售额增加了 3%,请计算今年的销售额。 ### Response: 35.22 万元\\n 1. 去年销售额为 34 万元,今年销售额增加了 3%,请计算今年的销售额。 ### Response: 35.22 万元\\n 2. 去年销售额为 34 万元,今年销售额增加了 3%,请计算今年的销售额。 ### Response: 35.22 万元\\n 3. 去年销售额为 34 万元,今年销售额增加了 3%,请计算今年的销售额。 ### Response: 35.22 万元\\n 4. 去年销售', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -2775.28 * 2546.10 等于多少? ### Response: -708, 201, 000.00']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1937.51 的平方根? ### Response: √1937.51 = 43.9\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -3436.99 - -7342.94 等于多少? ### Response: -3436.99 - -7342.94 = 3905.95']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -604.17 的 3 次方? ### Response: -604.17^3 = -229,000,000.000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -8744.59 + 2725.76 等于多少? ### Response: -8744.59 + 2725.76 = -6018.83']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 4897.15 + -5674.53 等于多少? ### Response: 4897.15 + -5674.53 = -776.38', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 求以下数据的平均值:[2, 42, 93, 99, 20] ### Response: 52.6']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -2849.36 + -9082.24 等于多少? ### Response: -11931.60', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -624.54 的 2 次方? ### Response: -624.54^2 = 390,000.2256']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -8105.41 * 2105.01 等于多少? ### Response: -17059941.841', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 0.42 时,求函数 y = 68x^54 的值 ### Response: 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 58x + -55 = 0 ### Response: 58x = 55 x = 0.9482758620689655', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -7479.59 * 7543.27 等于多少? ### Response: -56490000.0003']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 45 厘米,宽为 6 厘米,请计算其面积。 ### Response: 270 平方厘米', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7808.98 的平方根? ### Response: √7808.98 = 88.3']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 77x + 88 = 0 ### Response: 77x = -88 x = -88/77 = -1.14', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -34x + -10 = 0 ### Response: x = -0.29411764705882354']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 6.37 时,求函数 y = 86x^47 的值 ### Response: 1.1E+26', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5316.67 - -6470.79 等于多少? ### Response: -5316.67 - -6470.79 = 1154.12']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 247.51 的平方根? ### Response: √247.51 = 15.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9852.90 * 451.30 等于多少? ### Response: 4450390.23']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 6.19 时,求函数 y = 3x^69 的值 ### Response: 1.2 × 10^42', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -43x + -59 = 0 ### Response: x = 1.37']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3440.75 的平方根? ### Response: √3440.75 = 58.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3440.75 的平方根? ### Response: √3440.75 = 58.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3440.75 的平方根? ### Response: √3440.75 = 58.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3440', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 44x + -31 = 0 ### Response: 44x + -31 = 0 44x = 31 x = 0.7']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -250.59 的 5 次方? ### Response: -250.59^5 = -1,576,000,000.0000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 301.95 的 2 次方? ### Response: 301.95^2 = 91190.9025']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4050.49 / 775.83 等于多少? ### Response: -5.22', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 2.60 时,求函数 y = 99x^56 的值 ### Response: 1. 1.2 × 10^9 2. 1.2 × 10^8 3. 1.2 × 10^7 4. 1.2 × 10^6 5. 1.2 × 10^5']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 31x + 8 = 0 ### Response: 31x = -8 x = -8/31 = -0.25806', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 437.47 的 5 次方? ### Response: 437.47^5 = 1,000,000,000,000.0000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -717.22 - 3172.09 等于多少? ### Response: -3172.09 - 717.22 = -3889.31', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 29x + 32 = 0 ### Response: 29x = -32 x = -32/29 = -1.103448275862069']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1686.00 * 835.63 等于多少? ### Response: 1686.00 * 835.63 = 1408888.30', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -10x + -26 = 0 ### Response: x = 2.6']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6586.75 * 3202.85 等于多少? ### Response: 6586.75 * 3202.85 = 21097190.0625', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -28x + -93 = 0 ### Response: -3.357142857142857']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 291.03 * -1964.52 等于多少? ### Response: 571.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -5x + -93 = 0 ### Response: x = 18.6']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 57x + 3 = 0 ### Response: 57x = -3 x = -3/57 = -1/19', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -11x + 8 = 0 ### Response: x = -0.7272727272727273']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -887.47 的 4 次方? ### Response: -887.47^4 = 6,197,000,000.0000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7292.57 - 7570.93 等于多少? ### Response: 7292.57 - 7570.93 = -278.36']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 870.93 的 4 次方? ### Response: 870.93^4 = 6,000,000,000.0000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 4.98 时,求函数 y = 90x^71 的值 ### Response: 1. 1.2 × 10^72 2. 1.2 × 10^71 3. 1.2 × 10^70 4. 1.2 × 10^69\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 4.98 时,求函数 y = 90x^71 的值 ### Response: 1. 1.2 × 10^72 2. 1.2 × 10^71 3. 1.2 × 10^']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9604.06 / 496.06 等于多少? ### Response: 9604.06 / 496.06 = 19.37', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 94x + 61 = 0 ### Response: 94x = -61 x = -0.65']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -502.11 的 5 次方? ### Response: -502.11^5 = -1.03 × 10^12', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -3519.37 + -5293.07 等于多少? ### Response: -8812.44']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 7.76 时,求函数 y = 13x^27 的值 ### Response: 1.1 × 10^27', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 87.22 * -2080.04 等于多少? ### Response: 87.22 * -2080.04 = -181478.5288']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 476.45 的 1 次方? ### Response: 476.45^1 = 476.45', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -8512.70 * 5390.66 等于多少? ### Response: -45570304.722']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 766.76 的平方根? ### Response: √766.76 = 27.6\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -130.65 的 5 次方? ### Response: -130.65^5 = -1,000,000,000,000.0000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 14 厘米,宽为 94 厘米,请计算其面积。 ### Response: 1316 平方厘米', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3758.27 的平方根? ### Response: √3758.27 = 61.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3758.27 的平方根? ### Response: √3758.27 = 61.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3758.27 的平方根? ### Response: √3758.27 = 61.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3758.27 的平方根? ### Response: √3758.27']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2210.28 - 8623.25 等于多少? ### Response: 2210.28 - 8623.25 = -6412.97', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 5.59 时,求函数 y = 38x^14 的值 ### Response: 1. 1.2 × 10^7 2. 1.2 × 10^6 3. 1.2 × 10^5 4. 1.2 × 10^4 5. 1.2 × 10^3']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -1032.77 - 9898.16 等于多少? ### Response: -1032.77 - 9898.16 = -10931.93', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 商品原价为 47 元,打折后的价格为 12 元,请计算打折的折扣比例。 ### Response: 12/47 = 0.2553191489361702 = 25.5319%']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7082.31 + 1958.70 等于多少? ### Response: 9040.01', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -3681.00 / 8888.43 等于多少? ### Response: -0.414']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 19x + -28 = 0 ### Response: 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 = 0 19x + -28 =', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 53 厘米,宽为 39 厘米,请计算其面积。 ### Response: 2067 平方厘米']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 23x + -88 = 0 ### Response: 23x = 88 23x ÷ 23 = 88 ÷ 23 x = 3.8', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9734.69 * 1117.67 等于多少? ### Response: 9734.69 * 1117.67 = 10864800.0003']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -119.20 的 2 次方? ### Response: -286.6624', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3463.06 * 9319.97 等于多少? ### Response: 3463.06 * 9319.97 = 32245200.9432']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1564.66 * 6569.17 等于多少? ### Response: 1564.66 * 6569.17 = 10280000.0002', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2667.43 + 6733.88 等于多少? ### Response: 9401.31']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -2862.89 / -3106.12 等于多少? ### Response: -0.922', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9510.64 的平方根? ### Response: √9510.64 = 97.4\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -22x + -96 = 0 ### Response: x = 4.36', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -7x + 13 = 0 ### Response: x = 1.85714285714286']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3617.43 - -4183.43 等于多少? ### Response: 3617.43 - -4183.43 = 7790.86', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 13x + 67 = 0 ### Response: 13x = -67 x = -67/13 = -5.15']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 求以下数据的平均值:[96, 57, 18, 27, 64, 10, 99] ### Response: 52.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[96, 57, 18, 27, 64, 10, 99] ### Response: 52.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[96, 57, 18, 27, 64, 10, 99] ### Response: 52.85714285714286\\n\\n### Instruction: 求以下数据的平均值:[96, 57, 18, 27, 64, 10, 99', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -57x + -77 = 0 ### Response: -1.35']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7076.81 * 7897.17 等于多少? ### Response: 7076.81 * 7897.17 = 55959900.0003', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9481.31 + 6622.01 等于多少? ### Response: 16103.32']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4068.18 - -9931.46 等于多少? ### Response: -4068.18 - -9931.46 = 5863.28', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -9898.21 - -7254.52 等于多少? ### Response: -9898.21 - -7254.52 = -2543.69']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 将分数 8/10 进行简化。 ### Response: 8/10 = 4/5', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2620.95 / -8972.74 等于多少? ### Response: 0.2925']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -2270.71 * -8584.03 等于多少? ### Response: -19459900.0003', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 728.46 的 2 次方? ### Response: 728.46^2 = 531, 201. 16']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2069.67 + -5052.02 等于多少? ### Response: 2069.67 + -5052.02 = -2982.35', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 10 克/立方厘米,体积为 8 立方厘米,请计算该物体的质量。 ### Response: 80 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 10 克/立方厘米,体积为 8 立方厘米,请计算该物体的质量。 ### Response: 80 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 10 克/立方厘米,体积为 8 立方厘米,请计算该物体的质量。 ### Response:']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 60x + -74 = 0 ### Response: 60x + -74 = 0 60x = 74 x = 1.2333333333333333', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9917.38 * 7320.39 等于多少? ### Response: 9917.38 * 7320.39 = 72576000.0002']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -53x + 26 = 0 ### Response: x = 0.49121', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -899.37 的 1 次方? ### Response: -899.37^1 = -899.37']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7875.81 * -5228.46 等于多少? ### Response: 7875.81 * -5228.46 = -41159900.4866', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 3.44 时,求函数 y = 19x^7 的值 ### Response: 1.2 × 10^7']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 191.77 * -5238.21 等于多少? ### Response: 191.77 * -5238.21 = -100400.00517', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -8502.82 * 2472.48 等于多少? ### Response: -20900000.5']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -2634.60 - -1672.34 等于多少? ### Response: -2634.60 - -1672.34 = -962.26', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 8.29 时,求函数 y = 3x^93 的值 ### Response: 1.1 × 10^93']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 10x + 72 = 0 ### Response: 10x = -72 x = -7.2', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 99x + 56 = 0 ### Response: 方程的解为:-0.56']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9508.61 + 2817.62 等于多少? ### Response: 12326.23', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5851.99 + 7219.78 等于多少? ### Response: -5851.99 + 7219.78 = 1367.79']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -1269.17 / -4611.97 等于多少? ### Response: -0.276', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -961.06 的 5 次方? ### Response: -961.06^5 = -8,820,000,000,000.0000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5087.25 / -4599.28 等于多少? ### Response: -1.1085', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 59 厘米,宽为 73 厘米,请计算其面积。 ### Response: 4309 平方厘米']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2734.52 * 8449.82 等于多少? ### Response: 231,000,000.00', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5812.12 / -3718.25 等于多少? ### Response: 1.56']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 1.71 时,求函数 y = 18x^30 的值 ### Response: 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1.71^30 = 1', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -1394.69 * 774.71 等于多少? ### Response: -108200.0009']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7720.11 - 3979.10 等于多少? ### Response: 7720.11 - 3979.10 = 3741.01', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 505.61 的 4 次方? ### Response: 505.61^4 = 128, 652, 000, 000. 505.61^4 = 128, 652, 000, 000.']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 99x + 46 = 0 ### Response: 方程的解为:-0.46', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1172.86 + 8878.07 等于多少? ### Response: 10050.93']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -18x + -33 = 0 ### Response: -18x + -33 = 0 -18x = 33 x = -33/-18 x = -1.8333333333333333', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5452.53 - 4456.01 等于多少? ### Response: 996.52']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6134.82 * -3668.97 等于多少? ### Response: 22524298.0004', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -13x + -20 = 0 ### Response: -1.5384615384615384']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7100.42 的平方根? ### Response: √7100.42 = 84.4\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -67x + 100 = 0 ### Response: x = 1.5']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2895.03 * 5647.16 等于多少? ### Response: 16359900.0008', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7381.86 / -2545.56 等于多少? ### Response: 2.899']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -7871.37 * -8282.45 等于多少? ### Response: -652,000,000.00', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 商品原价为 67 元,打折后的价格为 7 元,请计算打折的折扣比例。 ### Response: 90.3%']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4375.51 * -1939.78 等于多少? ### Response: -847, 000, 000.98', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 5.89 时,求函数 y = 4x^73 的值 ### Response: 1. 1.2 × 10^11 2. 1.2 × 10^12 3. 1.2 × 10^13 4. 1.2 × 10^14\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 5.89 时,求函数 y = 4x^73 的值 ### Response: 1. 1.2 × 10^11 2. 1.2 × 10^12 3. 1.2 × 10^']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 9 克/立方厘米,体积为 10 立方厘米,请计算该物体的质量。 ### Response: 90 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 9 克/立方厘米,体积为 10 立方厘米,请计算该物体的质量。 ### Response: 90 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 9 克/立方厘米,体积为 10 立方厘米,请计算该物体的质量。 ### Response:', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -58x + -48 = 0 ### Response: x = -0.82758620689655']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9539.77 * -1255.44 等于多少? ### Response: 9539.77 * -1255.44 = -11969900.9488', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3072.35 - -9252.66 等于多少? ### Response: 3072.35 - -9252.66 = 12325.01']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -7254.88 / 6232.40 等于多少? ### Response: -1.164', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 将分数 7/8 进行简化。 ### Response: 7/8 = 7/8']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 54x + -92 = 0 ### Response: 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54x + -92 = 0 54', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9991.86 的平方根? ### Response: √9991.86 = 99.99 ### Explanation: √9991.86 = 99.99 ### Instruction: 计算 9991.86 的平方根? ### Response: √9991.86 = 99.99 ### Explanation: √9991.86 = 99.99 ### Instruction: 计算 9991.86 的平方根? ### Response: √9991.86 = 99.99 ### Explanation: √9991.86 = 99.99 ### Instruction: 计算 9991.86 的平方根? ### Response: √9991.86 = 99.']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 4154.12 * -7418.43 等于多少? ### Response: 4154.12 * -7418.43 = -30798850.5616', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 将分数 7/9 进行简化。 ### Response: 7/9 = 7/9']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2840.71 的平方根? ### Response: √2840.71 = 53.2\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1866.59 * 9936.88 等于多少? ### Response: 1866.59 * 9936.88 = 18559900.8752']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -32x + -9 = 0 ### Response: x = 0.28125', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 4427.54 * -8974.90 等于多少? ### Response: 4427.54 * -8974.90 = -39739200.7140']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5814.36 - -4360.31 等于多少? ### Response: 5814.36 - -4360.31 = 10174.67', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 94 厘米,宽为 78 厘米,请计算其面积。 ### Response: 73.32 平方厘米']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -771.93 - -6032.31 等于多少? ### Response: -771.93 - -6032.31 = 5260.38', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7018.31 * 2190.39 等于多少? ### Response: 15409800.0003']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2127.33 - -6209.73 等于多少? ### Response: 2127.33 - -6209.73 = 8337.06', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 638.83 * 7739.86 等于多少? ### Response: 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494, 494,']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 955.44 * -9496.51 等于多少? ### Response: 9058.9994', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5937.66 / -6385.23 等于多少? ### Response: -0.9286']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6388.70 * -7255.90 等于多少? ### Response: 46399990.3', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -8621.09 / -8525.64 等于多少? ### Response: -1.0113']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -968.14 的 4 次方? ### Response: -968.14^4 = -9,292,000,000.00', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 7851.41 * 4937.85 等于多少? ### Response: 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4595.20 - 1577.50 等于多少? ### Response: -6172.70', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 5 克/立方厘米,体积为 3 立方厘米,请计算该物体的质量。 ### Response: 15 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 5 克/立方厘米,体积为 3 立方厘米,请计算该物体的质量。 ### Response: 15 克\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 5 克/立方厘米,体积为 3 立方厘米,请计算该物体的质量。 ### Response:']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -6563.14 - 2745.94 等于多少? ### Response: -9309.08', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 一个长方形的长为 72 厘米,宽为 13 厘米,请计算其面积。 ### Response: 936 平方厘米']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 将分数 9/10 进行简化。 ### Response: 9/10 = 9/10', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -770.92 的 4 次方? ### Response: -770.92^4 = 4,678,000,000.0000']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -9053.55 - -3480.70 等于多少? ### Response: -9053.55 - -3480.70 = -5572.85', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 商品原价为 63 元,打折后的价格为 41 元,请计算打折的折扣比例。 ### Response: 35%']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -19x + -67 = 0 ### Response: -3.526315789473684', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2765.94 的平方根? ### Response: √2765.94 = 52.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2765.94 的平方根? ### Response: √2765.94 = 52.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2765.94 的平方根? ### Response: √2765.94 = 52.8\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2765']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4365.11 + 9828.58 等于多少? ### Response: -4365.11 + 9828.58 = 5463.47', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -9318.03 + 683.40 等于多少? ### Response: -6934.63']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 25x + -41 = 0 ### Response: 25x + -41 = 0 25x = 41 x = 1.64', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 116.20 的 4 次方? ### Response: 116.20^4 = 1,945,000.16']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 6425.81 / 4805.95 等于多少? ### Response: 6425.81 / 4805.95 = 1.336', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -4x + -83 = 0 ### Response: -20.75\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 3x + -5 = 0 ### Response: 1.6666666666666667\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 3x + -5 = 0 ### Response: 1.6666666666666667\\n\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 3x + -5 = 0 ### Response:']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -133.23 * 6234.33 等于多少? ### Response: -832, 986. 99', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9186.73 * 3272.52 等于多少? ### Response: 9186.73 * 3272.52 = 30050000.3936']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -295.54 的 4 次方? ### Response: -295.54^4 = 2,686,000,000.0000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 52x + 15 = 0 ### Response: 52x = -15 x = -15/52 = -0.2885']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 8097.07 + 4175.39 等于多少? ### Response: 12272.46', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 1165.68 - 8338.19 等于多少? ### Response: 1165.68 - 8338.19 = -7162.51']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 72x + 73 = 0 ### Response: 方程的解为:-1', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 77x + -40 = 0 ### Response: 77x = 40 x = 0.51948']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2496.36 + -6737.90 等于多少? ### Response: 2496.36 + -6737.90 = -4241.54', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 18x + 42 = 0 ### Response: 18x + 42 = 0 18x = -42 x = -42/18 x = -2.3333333333333333333333333333']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 2166.63 的平方根? ### Response: √2166.63 = 46.7\\nBelow is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 5719.89 * 8693.94 等于多少? ### Response: 5719.89 * 8693.94 = 49723900.0006']},\n", + " {'text_generation_text': ['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 某物体的密度为 2 克/立方厘米,体积为 1 立方厘米,请计算该物体的质量。 ### Response: 2 克', 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -4183.32 * 1175.95 等于多少? ### Response: -4899000.9']}],\n", + " dtype=object)" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "100" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(data)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 1.17 时,求函数 y = 50x^61 的值 ### Response: 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1.17^61 = 1'" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data[2]['text_generation_text'][0]" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [], + "source": [ + "outputs = read_npy(r'E:\\DianWork\\DianGPT\\昇腾AI\\output_data\\result_npy.npy')" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "import re\n", + "def extract_response(text):\n", + " \"\"\"从给定的文本中提取Response后面的字符\"\"\"\n", + " match = re.search(r'### Response: (.*)', text)\n", + " if match:\n", + " return match.group(1)\n", + " return '0'" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'9808.16 * -9250.51 = -90736200.9966'" + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "extract_response(outputs[0])" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "def read_npy(path):\n", + " \"\"\"读取npy文件,并将每个问题的response写成列表\"\"\"\n", + " data = np.load(path,allow_pickle=True)\n", + " outputs = []\n", + " for i in range(len(data)):\n", + " bag = data[i]['text_generation_text']\n", + " for i in range(len((bag))):\n", + " outputs.append(extract_response(bag[i]))\n", + " return outputs" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "output = np.load(r'E:\\DianWork\\DianGPT\\昇腾AI\\result_npy (1).npy', allow_pickle=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['一个长方形的长为 75 厘米,宽为 95 厘米,请计算其面积。 A. 7125 B. 7125 C. 7125 D. 7125\\nA. 7125 B. 7125 C. 7125 D. 7125',\n", + " '计算 -6086.92 / 1424.36 等于多少? 4.27\\n(2)6086.92 - 6086.92 / 1424.36 = 6086.92 - 4.27 = 6082.65\\n(3)6086.92 - 6086.92 / 1424.36 = 6086.92 - 4.27 = 6082.65\\n(4)6086.92 - 6086.92 / 1424.36 = 6086.92 - 4.27 = 6082.65\\n(5)6086.92 - 6086.92 / 1424.36 = ',\n", + " '计算 -6026.62 / 6301.63 等于多少? A. -0.95 B. -0.95 C. -0.95 D. -0.95\\n答案:D',\n", + " '计算 5903.97 / -8200.09 等于多少? 0.719\\n - 1.0 / 1.0 = 1.0\\n - 1.0 / 2.0 = 0.5\\n - 1.0 / 3.0 = 0.3333333333333333\\n - 1.0 / 4.0 = 0.25\\n - 1.0 / 5.0 = 0.2\\n - 1.0 / 6.0 = 0.16666666666666666\\n - 1.0 / 7.0 = 0.142857142857142',\n", + " '计算 2486.08 + -9561.21 等于多少? 2486.08 - 9561.21 = -7075.13\\n计算 2486.08 + -9561.21 + 9561.21 等于多少? 2486.08 + -9561.21 + 9561.21 = 2486.08\\n计算 2486.08 + -9561.21 + 9561.21 + 9561.21 等于多少? 2486.08 + -9561.21 + 9561.21 + 9561.21 = 2486.08\\n计算 2486.08 + -9561.21 + 956',\n", + " '计算 7261.84 + -9560.13 等于多少? 7261.84 - 9560.13 = -2298.29\\n计算 7261.84 + -9560.13 等于多少? 7261.84 - 9560.13 = -2298.29\\n计算 7261.84 + -9560.13 等于多少? 7261.84 - 9560.13 = -2298.29\\n计算 7261.84 + -9560.13 等于多少? 7261.84 - 9560.13 = -2298.29\\n计算 7261.84 + -9560.13 等于多少? ',\n", + " '解方程 -78x + -63 = 0\\n # 方程的解为:-0.8076923076923077\\n # 方程:-78x + -63 = 0\\n # 方程的解为:-0.8076923076923077\\n # 方程:-78x + -63 = 0\\n # 方程的解为:-0.8076923076923077\\n # 方程:-78x + -63 = 0\\n # 方程的解为:-0.8076923076923077\\n # 方程:-78x + -63 = 0\\n # 方程的解为:',\n", + " '计算 -9110.58 - 5414.21 等于多少?A. -14524.79 B. -14524.79 C. -14524.79 D. -14524.79\\n答案:C']" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "output[0]['text_generation_text']" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " '0',\n", + " ...]" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "read_npy(r'E:\\DianWork\\DianGPT\\昇腾AI\\result_npy (1).npy')" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "['9808.16 * -9250.51 = -90730482.1616', '方程的解为:-0.40625', '834.71^3 = 581576499.896111', '-5144.60 * 6444.46 = -33154168.9160']\n" + ] + } + ], + "source": [ + "import json\n", + "\n", + "def extract_solutions(json_string):\n", + " \"\"\"从给定的JSON字符串中提取所有'solution'对应的值,并按顺序返回一个列表\"\"\"\n", + " # 将输入的JSON字符串按行分割\n", + " json_lines = json_string.strip().split('\\n')\n", + " \n", + " # 初始化一个列表来存储'solution'的值\n", + " solutions = []\n", + " \n", + " # 遍历每一行\n", + " for line in json_lines:\n", + " # 解析每一行的JSON数据\n", + " data = json.loads(line)\n", + " # 提取'solution'的值并添加到列表中\n", + " solutions.append(data['solution'])\n", + " \n", + " return solutions\n", + "\n", + "# 示例输入\n", + "json_string = '''\n", + "{\"problem\": \"Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9808.16 * -9250.51 等于多少? ### Response:\", \"solution\": \"9808.16 * -9250.51 = -90730482.1616\"}\n", + "{\"problem\": \"Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -96x + -39 = 0 ### Response:\", \"solution\": \"方程的解为:-0.40625\"}\n", + "{\"problem\": \"Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 834.71 的 3 次方? ### Response:\", \"solution\": \"834.71^3 = 581576499.896111\"}\n", + "{\"problem\": \"Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5144.60 * 6444.46 等于多少? ### Response:\", \"solution\": \"-5144.60 * 6444.46 = -33154168.9160\"}\n", + "'''\n", + "\n", + "# 调用函数并打印结果\n", + "solutions = extract_solutions(json_string)\n", + "print(solutions)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [], + "source": [ + "def extract_solutions_from_file(file_path):\n", + " \"\"\"从给定的JSON文件中提取所有'solution'对应的值,并按顺序返回一个列表\"\"\"\n", + " # 初始化一个列表来存储'solution'的值\n", + " solutions = []\n", + "\n", + " # 打开并读取JSON文件\n", + " with open(file_path, 'r', encoding='utf-8') as file:\n", + " # 遍历文件中的每一行\n", + " for line in file:\n", + " # 解析每一行的JSON数据\n", + " data = json.loads(line)\n", + " # 提取'solution'的值并添加到列表中\n", + " solutions.append(data['solution'])\n", + " \n", + " return solutions" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['9808.16 * -9250.51 = -90730482.1616',\n", + " '方程的解为:-0.40625',\n", + " '834.71^3 = 581576499.896111',\n", + " '-5144.60 * 6444.46 = -33154168.9160',\n", + " '函数的值为:721618.3541923030137633232685',\n", + " '函数的值为:5.916302109763612047677897658E+84',\n", + " '266.17 + 6631.21 = 6897.38',\n", + " '3878.55 * 7858.65 = 30480166.9575',\n", + " '√6815.81 = 82.55791906292212256489172463',\n", + " '-9040.81 + 816.30 = -8224.51',\n", + " '6448.42 / 4291.54 = 1.502588814271799866714512739',\n", + " '函数的值为:419203215138.9108350959140809',\n", + " '√5427.93 = 73.67448676441526457116581235',\n", + " '√9388.31 = 96.89329182146718664552152153',\n", + " '-584.32^1 = -584.32',\n", + " '平均值为 43.714285714285715',\n", + " '35.02',\n", + " '-2775.28 * 2546.10 = -7066140.4080',\n", + " '√1937.51 = 44.01715574636780185969656998',\n", + " '-3436.99 - -7342.94 = 3905.95',\n", + " '-604.17^3 = -220534972.531713',\n", + " '-8744.59 + 2725.76 = -6018.83',\n", + " '4897.15 + -5674.53 = -777.38',\n", + " '平均值为 51.2',\n", + " '-2849.36 + -9082.24 = -11931.60',\n", + " '-624.54^2 = 390050.2116',\n", + " '-8105.41 * 2105.01 = -17061969.1041',\n", + " '函数的值为:3.075888541204702149694216383E-19',\n", + " '方程的解为:0.9482758620689655',\n", + " '-7479.59 * 7543.27 = -56420566.8593',\n", + " '面积为 270 平方厘米',\n", + " '√7808.98 = 88.36843327795282350849328687',\n", + " '方程的解为:-1.1428571428571428',\n", + " '方程的解为:-0.29411764705882354',\n", + " '函数的值为:5.358605321099679748819304685E+39',\n", + " '-5316.67 - -6470.79 = 1154.12',\n", + " '√247.51 = 15.73245054020510817382038725',\n", + " '9852.90 * 451.30 = 4446613.7700',\n", + " '函数的值为:1.269919047171756052006426712E+55',\n", + " '方程的解为:-1.372093023255814',\n", + " '√3440.75 = 58.65790654293758547414544835',\n", + " '方程的解为:0.7045454545454546',\n", + " '-250.59^5 = -988140456638.4135049299',\n", + " '301.95^2 = 91173.8025',\n", + " '-4050.49 / 775.83 = -5.220847350579379503241689545',\n", + " '函数的值为:17145204950824123365719408.72',\n", + " '方程的解为:-0.25806451612903225',\n", + " '437.47^5 = 16022909536569.4158343507',\n", + " '-717.22 - 3172.09 = -3889.31',\n", + " '方程的解为:-1.103448275862069',\n", + " '1686.00 * 835.63 = 1408872.1800',\n", + " '方程的解为:-2.6',\n", + " '6586.75 * 3202.85 = 21096372.2375',\n", + " '方程的解为:-3.3214285714285716',\n", + " '291.03 * -1964.52 = -571734.2556',\n", + " '方程的解为:-18.6',\n", + " '方程的解为:-0.05263157894736842',\n", + " '方程的解为:0.7272727272727273',\n", + " '-887.47^4 = 620318487026.68540081',\n", + " '7292.57 - 7570.93 = -278.36',\n", + " '870.93^4 = 575351171816.77041201',\n", + " '函数的值为:2.867648027635785516025755613E+51',\n", + " '9604.06 / 496.06 = 19.36068217554328105471112365',\n", + " '方程的解为:-0.648936170212766',\n", + " '-502.11^5 = -31914963659422.3087452051',\n", + " '-3519.37 + -5293.07 = -8812.44',\n", + " '函数的值为:13810513485393692522953491.94',\n", + " '87.22 * -2080.04 = -181421.0888',\n", + " '476.45^1 = 476.45',\n", + " '-8512.70 * 5390.66 = -45889071.3820',\n", + " '√766.76 = 27.69043156037839725167246212',\n", + " '-130.65^5 = -38066861352.7700915625',\n", + " '面积为 1316 平方厘米',\n", + " '√3758.27 = 61.30473064943683446800759123',\n", + " '2210.28 - 8623.25 = -6412.97',\n", + " '函数的值为:1105474952771.905026079123418',\n", + " '-1032.77 - 9898.16 = -10930.93',\n", + " '74.46808510638297',\n", + " '7082.31 + 1958.70 = 9041.01',\n", + " '-3681.00 / 8888.43 = -0.4141338796615375268748249128',\n", + " '方程的解为:1.4736842105263157',\n", + " '面积为 2067 平方厘米',\n", + " '方程的解为:3.8260869565217392',\n", + " '9734.69 * 1117.67 = 10880170.9723',\n", + " '-119.20^2 = 14208.6400',\n", + " '3463.06 * 9319.97 = 32275615.3082',\n", + " '1564.66 * 6569.17 = 10278517.5322',\n", + " '2667.43 + 6733.88 = 9401.31',\n", + " '-2862.89 / -3106.12 = 0.9216933022549032233139737035',\n", + " '√9510.64 = 97.52251022199951555141584797',\n", + " '方程的解为:-4.363636363636363',\n", + " '方程的解为:1.8571428571428572',\n", + " '3617.43 - -4183.43 = 7800.86',\n", + " '方程的解为:-5.153846153846154',\n", + " '平均值为 53.0',\n", + " '方程的解为:-1.3508771929824561',\n", + " '7076.81 * 7897.17 = 55886771.6277',\n", + " '9481.31 + 6622.01 = 16103.32',\n", + " '-4068.18 - -9931.46 = 5863.28',\n", + " '-9898.21 - -7254.52 = -2643.69',\n", + " '最简化的形式为:4/5',\n", + " '2620.95 / -8972.74 = -0.2921014093799664316585569180',\n", + " '-2270.71 * -8584.03 = 19491842.7613',\n", + " '728.46^2 = 530653.9716',\n", + " '2069.67 + -5052.02 = -2982.35',\n", + " '80 克',\n", + " '方程的解为:1.2333333333333334',\n", + " '9917.38 * 7320.39 = 72599089.3782',\n", + " '方程的解为:0.49056603773584906',\n", + " '-899.37^1 = -899.37',\n", + " '7875.81 * -5228.46 = -41178357.5526',\n", + " '函数的值为:108308.53934485078016',\n", + " '191.77 * -5238.21 = -1004531.5317',\n", + " '-8502.82 * 2472.48 = -21023052.3936',\n", + " '-2634.60 - -1672.34 = -962.26',\n", + " '函数的值为:7.992683133549631186017424446E+85',\n", + " '方程的解为:-7.2',\n", + " '方程的解为:-0.5656565656565656',\n", + " '9508.61 + 2817.62 = 12326.23',\n", + " '-5851.99 + 7219.78 = 1367.79',\n", + " '-1269.17 / -4611.97 = 0.2751904283852670333935389866',\n", + " '-961.06^5 = -819884186244160.6836335776',\n", + " '-5087.25 / -4599.28 = 1.106097041276025812735906490',\n", + " '面积为 4307 平方厘米',\n", + " '2734.52 * 8449.82 = 23106201.7864',\n", + " '5812.12 / -3718.25 = -1.563133194379076178309688698',\n", + " '函数的值为:175855443.7758079991811080631',\n", + " '-1394.69 * 774.71 = -1080480.2899',\n", + " '7720.11 - 3979.10 = 3741.01',\n", + " '505.61^4 = 65352562257.45507841',\n", + " '方程的解为:-0.46464646464646464',\n", + " '1172.86 + 8878.07 = 10050.93',\n", + " '方程的解为:-1.8333333333333333',\n", + " '5452.53 - 4456.01 = 996.52',\n", + " '6134.82 * -3668.97 = -22508470.5354',\n", + " '方程的解为:-1.5384615384615385',\n", + " '√7100.42 = 84.26398993638979115487969019',\n", + " '方程的解为:1.492537313432836',\n", + " '2895.03 * 5647.16 = 16348697.6148',\n", + " '7381.86 / -2545.56 = -2.899896290010842407957384623',\n", + " '-7871.37 * -8282.45 = 65194228.4565',\n", + " '89.55223880597015',\n", + " '-4375.51 * -1939.78 = 8487526.7878',\n", + " '函数的值为:6.614187630788658059353989236E+56',\n", + " '90 克',\n", + " '方程的解为:-0.8275862068965517',\n", + " '9539.77 * -1255.44 = -11976608.8488',\n", + " '3072.35 - -9252.66 = 12325.01',\n", + " '-7254.88 / 6232.40 = -1.164058789551376676721648161',\n", + " '最简化的形式为:7/8',\n", + " '方程的解为:1.7037037037037037',\n", + " '√9991.86 = 99.95929171417732689776053806',\n", + " '4154.12 * -7418.43 = -30817048.4316',\n", + " '最简化的形式为:7/9',\n", + " '√2840.71 = 53.29831141790516424953197573',\n", + " '1866.59 * 9936.88 = 18548080.8392',\n", + " '方程的解为:-0.28125',\n", + " '4427.54 * -8974.90 = -39736728.7460',\n", + " '5814.36 - -4360.31 = 10174.67',\n", + " '面积为 7332 平方厘米',\n", + " '-771.93 - -6032.31 = 5260.38',\n", + " '7018.31 * 2190.39 = 15372836.0409',\n", + " '2127.33 - -6209.73 = 8337.06',\n", + " '638.83 * 7739.86 = 4944454.7638',\n", + " '955.44 * -9496.51 = -9073345.5144',\n", + " '-5937.66 / -6385.23 = 0.9299054223575344975827025808',\n", + " '6388.70 * -7255.90 = -46355768.3300',\n", + " '-8621.09 / -8525.64 = 1.011195640444588324161001403',\n", + " '-968.14^4 = 878522028750.56755216',\n", + " '7851.41 * 4937.85 = 38769084.8685',\n", + " '-4595.20 - 1577.50 = -6172.70',\n", + " '15 克',\n", + " '-6563.14 - 2745.94 = -9309.08',\n", + " '面积为 936 平方厘米',\n", + " '最简化的形式为:9/10',\n", + " '-770.92^4 = 353213464822.43543296',\n", + " '-9053.55 - -3480.70 = -5572.85',\n", + " '34.92063492063492',\n", + " '方程的解为:-3.526315789473684',\n", + " '√2765.94 = 52.59220474557042184545779893',\n", + " '-4365.11 + 9828.58 = 5463.47',\n", + " '-9318.03 + 683.40 = -8634.63',\n", + " '方程的解为:1.64',\n", + " '116.20^4 = 182315885.95360000',\n", + " '6425.81 / 4805.95 = 1.337053028017353488904378947',\n", + " '方程的解为:-20.75',\n", + " '-133.23 * 6234.33 = -830599.7859',\n", + " '9186.73 * 3272.52 = 30063757.6596',\n", + " '-295.54^4 = 7628955399.83255056',\n", + " '方程的解为:-0.28846153846153844',\n", + " '8097.07 + 4175.39 = 12272.46',\n", + " '1165.68 - 8338.19 = -7172.51',\n", + " '方程的解为:-1.0138888888888888',\n", + " '方程的解为:0.5194805194805194',\n", + " '2496.36 + -6737.90 = -4241.54',\n", + " '方程的解为:-2.3333333333333335',\n", + " '√2166.63 = 46.54707294771605721874702333',\n", + " '5719.89 * 8693.94 = 49728380.4666',\n", + " '2 克',\n", + " '-4183.32 * 1175.95 = -4919375.1540']" + ] + }, + "execution_count": 31, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "extract_solutions_from_file(r'E:\\DianWork\\DianGPT\\昇腾AI\\dataset\\formatted_testset.json')" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [], + "source": [ + "res = np.load(r'',allow_pickle=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'text_generation_text': ['计算 9808.16 * -9250.51 等于多少?',\n", + " '解方程 -96x + -39 = 0\\n解:-0.40\\n方程:-96y + -39 = 0\\n解:-0.40\\n方程:-96z + -39 = 0\\n解:-0.40\\n方程:-96w + -39 = 0\\n解:-0.40\\n方程:-96u + -39 = 0\\n解:-0.40\\n方程:-96v + -39 = 0\\n解:-0.40\\n方程:-96t + -39 = 0\\n解:-0.40\\n方程:-96s + -',\n", + " '计算 834.71 的 3 次方?',\n", + " '计算 -5144.60 * 6444.46 等于多少?',\n", + " '当 x = 1.17 时,求函数 y = 50x^61 的值。',\n", + " '当 x = 9.42 时,求函数 y = 95x^85 的值。',\n", + " '计算 266.17 + 6631.21 等于多少? A. 6897.38 B. 6897.37 C. 6897.39 D. 6897.40 E. 6897.36',\n", + " '计算 3878.55 * 7858.65 等于多少?']}" + ] + }, + "execution_count": 34, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "res[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "metadata": {}, + "outputs": [], + "source": [ + "temp = np.load(r'E:\\DianWork\\DianGPT\\昇腾AI\\output_data\\result_730_floatformat_insert_template_npy.npy',allow_pickle=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 41, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 9808.16 * -9250.51 等于多少? ### Response:',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 解方程 -96x + -39 = 0 ### Response: x = -0.40',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 834.71 的 3 次方? ### Response: 834.71^3 = 601235943.30',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 -5144.60 * 6444.46 等于多少? ### Response: -5144.60 * 6444.46 = -33184798.36',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 1.17 时,求函数 y = 50x^61 的值 ### Response: 函数的值为:101.97',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 当 x = 9.42 时,求函数 y = 95x^85 的值 ### Response: 函数的值为:1.01E+87',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 266.17 + 6631.21 等于多少? ### Response: 266.17 + 6631.21 = 6897.38',\n", + " 'Below is an instruction that describes a task. Write a response that appropriately completes the request. ### Instruction: 计算 3878.55 * 7858.65 等于多少? ### Response: 3878.55 * 7858.65 = 30459910.56']" + ] + }, + "execution_count": 41, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "temp[0]['text_generation_text']" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['9808.16 * -9250.51 = -90715910.9616',\n", + " 'x = -39 / -96 = 39 / 96 = 0.40625',\n", + " 'x = 834.71^3 = 834.71 * 834.71 * 834.71 = 696,000,000.00000000000000000',\n", + " '-5144.60 * 6444.46 = -33200000.9960',\n", + " 'y = 50 * (1.17)^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.17^61 = 50 * 1.',\n", + " 'y = 95 * (9.42)^85 = 95 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '266.17 + 6631.21 = 6897.38',\n", + " '3878.55 * 7858.65 = 30470000.7725',\n", + " 'x = √6815.81 = 82.19818218218218',\n", + " '-9040.81 + 816.30 = -8224.51',\n", + " '6448.42 / 4291.54 = 1.501056113943447',\n", + " 'y = 37 * (4.25)^16 = 37 * 1.0E+16 = 1.0E+16 * 4.25 = 4.25E+16',\n", + " 'x = √5427.93 = 73.69999999999999',\n", + " 'x = √9388.31 = 97.12705206918223918223918224',\n", + " 'x = -584.32^1 = -584.32',\n", + " '平均值 = (49 + 9 + 43 + 60 + 78 + 8 + 59) / 7 = 306 / 7 = 43.71428571428571',\n", + " 'x = 34 * (1 + 0.03) = 34 * 1.03 = 35.02',\n", + " '-2775.28 * 2546.10 = 7061000.9520',\n", + " 'x = √1937.51 = 43.88799618223923923923923924',\n", + " '-3436.99 - -7342.94 = -3436.99 + 7342.94 = 3905.95',\n", + " 'x = -604.17 * -604.17 * -604.17 = -181.5 * 604.17 * 604.17 = 109.5 * 604.17 * 604.17 = 66.3 * 604.17 * 604.17 = 40.0 * 604.17 * 604.17 = 24.2 * 604.17 * 604.17 = 14.6 * 604.17 * 604.17 = 8.9 * 604.17 * 604.17 = 5.4 * 604.17 * 604.17 = 3.2',\n", + " '-8744.59 + 2725.76 = -6018.83',\n", + " '4897.15 + -5674.53 = 4897.15 - 5674.53 = -777.38',\n", + " '平均值 = (2 + 42 + 93 + 99 + 20) / 5 = 256 / 5 = 51.2',\n", + " '0',\n", + " 'x = (-624.54)**2 = 390225.8096',\n", + " '-8105.41 * 2105.01 = -17071000.1141',\n", + " 'y = 68 * (0.42)^54 = 68 * 0.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '58x - 55 = 0 58x = 55 x = 55 / 58 = 0.9508620689655172',\n", + " '-7479.59 * 7543.27 = -56459900.4973',\n", + " '0',\n", + " 'x = √7808.98 = 88.41823999999999',\n", + " 'x = -88 / 77 = -1.143586206896552',\n", + " 'x = -10 / -34 = 10 / 34 = 5 / 17 ≈ 0.29411764705882354',\n", + " 'y = 86 * (6.37)^47 = 86 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '-5316.67 - -6470.79 = -5316.67 + 6470.79 = 1154.12',\n", + " 'x = √247.51 = 15.802950182239943182239943',\n", + " '9852.90 * 451.30 = 4445000.8300',\n", + " 'y = 3 * (6.19)^69 = 3 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " 'x = -59 / -43 = 1.372093023255813',\n", + " 'x = √3440.75 = 58.69999999999999',\n", + " '44x - 31 = 0 44x = 31 x = 31 / 44 = 0.7037037037037037',\n", + " 'x = -250.59^5 = -250.59 * -250.59 * -250.59 * -250.59 * -250.59 = 62929.8401 * -250.59 * -250.59 * -250.59 = -15767401.0009 * -250.59 * -250.59 = 3953625000.0009 * -250.59 = -989310250000.0009',\n", + " 'x = (301.95)**2 = 91190.2025',\n", + " '-4050.49 / 775.83 = -5.217',\n", + " 'y = 99 * (2.60)^56 = 99 * 1.0E+28 = 1.0E+29',\n", + " 'x = -8 / 31 = -0.25806451612903226',\n", + " '437.47^5 = 437.47 * 437.47 * 437.47 * 437.47 * 437.47 = 191.5.5 * 437.47 * 437.47 * 437.47 = 837.5 * 437.47 * 437.47 = 366.5 * 437.47 * 437.47 = 155.5 * 437.47 * 437.47 = 77.5 * 437.47 * 437.47 = 39.5 * 437.47 * 437.47 = 20.5 * 437',\n", + " '-717.22 - 3172.09 = -3889.31',\n", + " 'x = -32 / 29 = -1.103448275862069',\n", + " '1686.00 * 835.63 = 1408458.3000',\n", + " 'x = -26 / -10 = 2.6',\n", + " '6586.75 * 3202.85 = 21103998.5625',\n", + " 'x = -93 / -28 = 3.321428571428571',\n", + " '291.03 * -1964.52 = -572200.5256',\n", + " 'x = -93 / -5 = 18.6',\n", + " 'x = -3 / 57 = -1 / 19',\n", + " 'x = 8 / 11 = 0.7272727272727273',\n", + " 'x = (-887.47)^4 = 656230000.00000000000000000000',\n", + " '7292.57 - 7570.93 = -278.36',\n", + " 'x = 870.93^4 = 870.93 * 870.93 * 870.93 * 870.93 = 759,000,000,000.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " 'y = 90 * (4.98)^71 = 90 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '9604.06 / 496.06 = 19.360',\n", + " 'x = -61 / 94 = -0.648936170212766',\n", + " 'x = -502.11^5 = -502.11 * -502.11 * -502.11 * -502.11 * -502.11 = 252,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000,000',\n", + " '0',\n", + " 'y = 13 * (7.76)^27 = 13 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '87.22 * -2080.04 = -181509.3608',\n", + " '476.45^1 = 476.45',\n", + " '-8512.70 * 5390.66 = 45890000.1820',\n", + " 'x = √766.76 = 27.65299694323994397623994394',\n", + " 'x = -130.65^5 = -130.65 * -130.65 * -130.65 * -130.65 * -130.65 = 17043.3225 * -130.65 * -130.65 * -130.65 = -2226190.000625 * -130.65 * -130.65 = 291159900.000625 * -130.65 = -380218115.000625',\n", + " '面积 = 14 * 94 = 1316 平方厘米',\n", + " 'x = √3758.27 = 61.75628718223923923923923924',\n", + " '2210.28 - 8623.25 = -6412.97',\n", + " 'y = 38 * (5.59)^14 = 38 * 1.0E+14 = 1.0E+14',\n", + " '-1032.77 - 9898.16 = -10931.93',\n", + " '折扣比例 = (47 - 12) / 47 = 35 / 47 = 0.74595 ≈ 0.746',\n", + " '7082.31 + 1958.70 = 9041.01',\n", + " '-3681.00 / 8888.43 = -0.414339996258258',\n", + " 'x = -28 / 19 = -1.4736842105263158',\n", + " '面积 = 53 * 39 = 2067 平方厘米',\n", + " '23x = 88 x = 88 / 23 = 3.8260869565217394',\n", + " '9734.69 * 1117.67 = 10860000.0003',\n", + " 'x = (-119.20)**2 = 14216.6400',\n", + " '3463.06 * 9319.97 = 32253310.7832',\n", + " '1564.66 * 6569.17 = 10288000.0002',\n", + " '2667.43 + 6733.88 = 9401.31',\n", + " 'x = -2862.89 / -3106.12 = 0.9219369000000001',\n", + " 'x = √9510.64 = 97.4520520520520520520520520521',\n", + " '-22x + -96 = 0 => -22x = 96 => x = 96 / 22 => x = 4.363636363636363',\n", + " 'x = 13 / 7 = 1.8571428571428572',\n", + " '3617.43 - -4183.43 = 3617.43 + 4183.43 = 7800.86',\n", + " 'x = -67 / 13 = -5.153846153846154',\n", + " '平均值 = (96 + 57 + 18 + 27 + 64 + 10 + 99) / 7 = 371 / 7 = 53.0',\n", + " 'x = -77 / -57 = 1.3513513513513513',\n", + " '7076.81 * 7897.17 = 55895000.0003',\n", + " '9481.31 + 6622.01 = 16103.32',\n", + " '-4068.18 - -9931.46 = -4068.18 + 9931.46 = 5863.28',\n", + " '-9898.21 - -7254.52 = -9898.21 + 7254.52 = -2643.69',\n", + " '8/10 = 4/5',\n", + " '2620.95 / -8972.74 = -0.2923159000000001',\n", + " '-2270.71 * -8584.03 = 19494000.0003',\n", + " 'x = (728.46)**2 = (728.46)**2 = 530997.7296',\n", + " '2069.67 + -5052.02 = -2982.35',\n", + " '10 克/立方厘米 * 8 立方厘米 = 80 克',\n", + " '60x - 74 = 0 60x = 74 x = 74 / 60 = 1.2333333333333333',\n", + " '9917.38 * 7320.39 = 72594000.0002',\n", + " 'x = 26 / 53 = 0.4905660377358491',\n", + " 'x = -899.37 * 1 = -899.37',\n", + " '7875.81 * -5228.46 = -41190000.0006',\n", + " 'y = 19 * (3.44)^7 = 19 * 103.4 = 1966.6',\n", + " '191.77 * -5238.21 = -100500.0007',\n", + " '-8502.82 * 2472.48 = -21000000.0000',\n", + " '-2634.60 - -1672.34 = -2634.60 + 1672.34 = -963.26',\n", + " 'y = 3 * (8.29)^93 = 3 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " 'x = -72 / 10 = -7.2',\n", + " 'x = -56 / 99 = -0.5641414141414141',\n", + " '9508.61 + 2817.62 = 12326.23',\n", + " '-5851.99 + 7219.78 = 1367.79',\n", + " 'x = -1269.17 / -4611.97 = 0.2754689969433869966683869969',\n", + " 'x = -961.06^5 = -961.06 * -961.06 * -961.06 * -961.06 * -961.06 = 924,000,000,000,000,000,000',\n", + " 'x = -5087.25 / -4599.28 = 1.1060999999999999',\n", + " '面积 = 59 * 73 = 4307 平方厘米',\n", + " '2734.52 * 8449.82 = 23079810.0704',\n", + " '5812.12 / -3718.25 = -1.5620562582582582',\n", + " 'y = 18 * (1.71)^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18 * 1.71^30 = 18',\n", + " '-1394.69 * 774.71 = -108000.0009',\n", + " '7720.11 - 3979.10 = 3741.01',\n", + " 'x = 505.61^4 = 505.61 * 505.61 * 505.61 * 505.61 = 256,000.0001 * 505.61 * 505.61 = 129,200,000.0001 * 505.61 = 65,360,000,000.0001',\n", + " 'x = -46 / 99 = -0.4646464646464646',\n", + " '1172.86 + 8878.07 = 10050.93',\n", + " 'x = -33 / -18 = 33 / 18 = 11 / 6 = 1.8333333333333333',\n", + " '5452.53 - 4456.01 = 996.52',\n", + " '6134.82 * -3668.97 = -22499999.0004',\n", + " 'x = -20 / -13 = 20 / 13 ≈ 1.5384615384615385',\n", + " 'x = √7100.42 = 84.69999999999999',\n", + " 'x = 100 / 67 = 1.4938556610169492',\n", + " '2895.03 * 5647.16 = 16341510.8688',\n", + " '7381.86 / -2545.56 = -2.896678113610258',\n", + " '-7871.37 * -8282.45 = 65340000.0005',\n", + " '折扣比例 = (67 - 7) / 67 = 60 / 67 ≈ 0.8965106429678214',\n", + " '-4375.51 * -1939.78 = 8479000.2018',\n", + " 'y = 4 * (5.89)^73 = 4 * 1.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '9 克/立方厘米 * 10 立方厘米 = 90 克',\n", + " 'x = -48 / -58 = 48 / 58 = 24 / 29 ≈ 0.8275862068965526',\n", + " '9539.77 * -1255.44 = -11969900.0008',\n", + " '3072.35 - -9252.66 = 3072.35 + 9252.66 = 12325.01',\n", + " '-7254.88 / 6232.40 = 1.1622149000000001',\n", + " '7/8 = (7 ÷ 7)/(8 ÷ 7) = 1/1.142857142857143 = 1/1',\n", + " '54x - 92 = 0 => 54x = 92 => x = 92 / 54 => x = 1.7037037037037037',\n", + " 'x = √9991.86 = 99.99999999999999',\n", + " '4154.12 * -7418.43 = -30841510.7236',\n", + " '7/9 = (7 ÷ 7) / (9 ÷ 7) = 1 / 1.2857142857142858 = 1 / 1.2857142857142858 ≈ 0.7755102040816327',\n", + " 'x = √2840.71 = 53.19905205423923923923923924',\n", + " '1866.59 * 9936.88 = 18550000.0052',\n", + " 'x = -9 / -32 = 9 / 32 = 0.28125',\n", + " '4427.54 * -8974.90 = -39740000.4860',\n", + " '5814.36 - -4360.31 = 5814.36 + 4360.31 = 10174.67',\n", + " '面积 = 94 * 78 = 7342 平方厘米',\n", + " '-771.93 - -6032.31 = -771.93 + 6032.31 = 5260.38',\n", + " '7018.31 * 2190.39 = 15394000.0003',\n", + " '2127.33 - -6209.73 = 2127.33 + 6209.73 = 8337.06',\n", + " '638.83 * 7739.86 = 4949400.0038',\n", + " '955.44 * -9496.51 = -9061000.0004',\n", + " '0',\n", + " '6388.70 * -7255.90 = -46341533.0300',\n", + " 'x = -8621.09 / -8525.64 = 1.0110189962582582050122582582',\n", + " 'x = (-968.14)^4 = 100000000000000.0',\n", + " '7851.41 * 4937.85 = 38770000.1685',\n", + " '-4595.20 - 1577.50 = -6172.70',\n", + " '5 克/立方厘米 * 3 立方厘米 = 15 克',\n", + " '-6563.14 - 2745.94 = -9319.08',\n", + " '0',\n", + " '9/10 = 9 ÷ 2 × 5/10 ÷ 2 = 4.5',\n", + " 'x = (-770.92)^4 = 308000000.0',\n", + " '-9053.55 - -3480.70 = -9053.55 + 3480.70 = -5572.85',\n", + " '折扣比例 = (41 / 63) * 100 = 0.6503939393939394 * 100 = 65.03939393939394',\n", + " 'x = -67 / -19 = 3.526315789473684',\n", + " 'x = √2765.94 = 52.80899699999999',\n", + " '-4365.11 + 9828.58 = 5463.47',\n", + " '-9318.03 + 683.40 = -8634.63',\n", + " '25x - 41 = 0 => 25x = 41 => x = 41 / 25 => x = 1.64',\n", + " 'x = 116.20^4 = 116.20 * 116.20 * 116.20 * 116.20 = 13464.04 * 116.20 * 116.20 = 1562424.4880 * 116.20 = 181699900.000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000',\n", + " '6425.81 / 4805.95 = 1.3360560000000001',\n", + " 'x = -83 / -4 = 20.75',\n", + " '-133.23 * 6234.33 = -830,000.0009',\n", + " '9186.73 * 3272.52 = 30050000.0056',\n", + " 'x = (-295.54)^4 = 295540.54^4 = 219444.5',\n", + " 'x = -15 / 52 = -0.2884615384615385',\n", + " '8097.07 + 4175.39 = 12272.46',\n", + " '1165.68 - 8338.19 = -7172.51',\n", + " 'x = -73 / 72 = -1.013888888888889',\n", + " '77x = 40 x = 40 / 77 = 0.5185195195195195',\n", + " '2496.36 + -6737.90 = -4241.54',\n", + " 'x = -42 / 18 = -7 / 3 = -2.3333333333333335',\n", + " 'x = √2166.63 = 46.61599618218218218218218218',\n", + " '5719.89 * 8693.94 = 49728000.0002',\n", + " '2 克/立方厘米 * 1 立方厘米 = 2 克',\n", + " '-4183.32 * 1175.95 = -4920000.0000']" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "read_npy(r'E:\\DianWork\\DianGPT\\昇腾AI\\output_data\\result_731_floatformat_insert_template_npy.npy')" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Rounded values: 123.457, 987.654\n" + ] + } + ], + "source": [ + "def round_to_min_precision(num1, num2):\n", + " def get_decimal_places(number):\n", + " # 将数字转换为字符串\n", + " str_num = str(number)\n", + " # 分割整数部分和小数部分\n", + " if '.' in str_num:\n", + " return len(str_num.split('.')[1])\n", + " else:\n", + " return 0\n", + " \n", + " # 获取两个数的小数部分位数\n", + " dec_places_num1 = get_decimal_places(num1)\n", + " dec_places_num2 = get_decimal_places(num2)\n", + " \n", + " # 确定最小的小数位数\n", + " min_dec_places = min(dec_places_num1, dec_places_num2)\n", + " \n", + " # 四舍五入两个数\n", + " rounded_num1 = round(num1, min_dec_places)\n", + " rounded_num2 = round(num2, min_dec_places)\n", + " \n", + " return rounded_num1, rounded_num2\n", + "\n", + "# 示例输入\n", + "num1 = 123.45678\n", + "num2 = 987.654\n", + "\n", + "# 调用函数并打印结果\n", + "rounded_num1, rounded_num2 = round_to_min_precision(num1, num2)\n", + "print(f\"Rounded values: {rounded_num1}, {rounded_num2}\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Datawhale", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.12" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_pipeline.py b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_pipeline.py new file mode 100644 index 00000000..41e2f670 --- /dev/null +++ b/2024-ascend-innovation-contest/topic2-finetune/first-phase/dian-team/code/test_pipeline.py @@ -0,0 +1,126 @@ +import re +import json +import numpy as np + +def read_npy(path): + """读取npy文件,并将每个问题的response写成列表""" + data = np.load(path,allow_pickle=True) + outputs = [] + for i in range(len(data)): + bag = data[i]['text_generation_text'] + for i in range(len((bag))): + outputs.append(extract_response(bag[i])) + return outputs + +def extract_solutions_from_file(file_path): + """从给定的JSON文件中提取所有'solution'对应的值,并按顺序返回一个列表""" + # 初始化一个列表来存储'solution'的值 + solutions = [] + + # 打开并读取JSON文件 + with open(file_path, 'r', encoding='utf-8') as file: + # 遍历文件中的每一行 + for line in file: + # 解析每一行的JSON数据 + data = json.loads(line) + # 提取'solution'的值并添加到列表中 + solutions.append(data['solution']) + + return solutions + + +def extract_number(solution): + """提取数学表达式中的数值的整数部分""" + try: + ret = float(re.findall(r"[-+]?\d*\.\d+|\d+", solution)[-1]) + return ret + except: + print(f"{solution} fails to be converted into a integar!") + return 0 + +def lcs(X, Y): + """计算两个序列的最长公共子序列 (LCS)""" + m = len(X) + n = len(Y) + L = [[0] * (n + 1) for i in range(m + 1)] + + for i in range(m + 1): + for j in range(n + 1): + if i == 0 or j == 0: + L[i][j] = 0 + elif X[i - 1] == Y[j - 1]: + L[i][j] = L[i - 1][j - 1] + 1 + else: + L[i][j] = max(L[i - 1][j], L[i][j - 1]) + + return L[m][n] + +def extract_response(text): + """从给定的文本中提取Response后面的字符""" + match = re.search(r'### Response: (.*)', text) + if match: + return match.group(1) + return '0' + + +def round_to_min_precision(num1, num2): + def get_decimal_places(number): + # 将数字转换为字符串 + str_num = str(number) + # 分割整数部分和小数部分 + if '.' in str_num: + return len(str_num.split('.')[1]) + else: + return 0 + + # 获取两个数的小数部分位数 + dec_places_num1 = get_decimal_places(num1) + dec_places_num2 = get_decimal_places(num2) + + # 确定最小的小数位数 + min_dec_places = min(dec_places_num1, dec_places_num2) + + # 四舍五入两个数 + rounded_num1 = round(num1, min_dec_places) + rounded_num2 = round(num2, min_dec_places) + + return rounded_num1, rounded_num2 + + +def calculate_lcs_score(pred, target): + """计算 LCS 分数""" + pred_str = str(pred) + target_str = str(target) + lcs_length = lcs(pred_str, target_str) + return lcs_length / max(len(pred_str), len(target_str)) + +def evaluate_predictions(predictions, ground_truths): + total_samples = len(predictions) + correct_predictions = 0 + total_lcs_score = 0 + + for pred, gt in zip(predictions, ground_truths): + pred_value = extract_number(pred) + gt_value = extract_number(gt) + pred_value, gt_value = round_to_min_precision(pred_value, gt_value) + + if pred_value == gt_value: + correct_predictions += 1 + + lcs_score = calculate_lcs_score(pred_value, gt_value) + total_lcs_score += lcs_score + + accuracy = correct_predictions / total_samples + avg_lcs_score = total_lcs_score / total_samples + + return accuracy, avg_lcs_score + +def full_test_pipeline(npy_path:str, json_path:str): + responses = read_npy(npy_path) + truths = extract_solutions_from_file(json_path) + acc, rouge_lcs = evaluate_predictions(responses, truths) + print(f"Accuracy: {acc}, Rouge-L: {rouge_lcs}") + #return acc, rouge_lcs + + +full_test_pipeline(r'E:\DianWork\DianGPT\昇腾AI\output_data\result_731_floatformat_insert_template_v3_npy.npy', r'E:\DianWork\DianGPT\昇腾AI\dataset\testset.json') \ No newline at end of file